framework,version,device,op_name,kernel_source,moe_dtype,num_tokens,hidden_size,inter_size,topk,num_experts,moe_tp_size,moe_ep_size,distribution,latency
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,1,power_law_1.01,0.1356287956237793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,1,power_law_1.2,0.13388160467147828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,1,power_law_1.01,0.2038719892501831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,1,power_law_1.2,0.18220160007476807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,1,power_law_1.01,0.24848639965057373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,1,power_law_1.2,0.23586559295654297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,1,power_law_1.01,0.4338496208190918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,1,power_law_1.2,0.4338240146636963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,1,power_law_1.01,0.44164481163024905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,1,power_law_1.2,0.4412735939025879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,1,power_law_1.01,0.4481919765472412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,1,power_law_1.2,0.4482431888580322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,1,power_law_1.01,0.4502399921417236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,1,power_law_1.2,0.4515200138092041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,1,power_law_1.01,0.4428736209869385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,1,power_law_1.2,0.4523263931274414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,1,power_law_1.01,0.4559807777404785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,1,power_law_1.2,0.4539648056030273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,1,power_law_1.01,0.4551551818847656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,1,power_law_1.2,0.4560256004333496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,1,power_law_1.01,0.48546562194824217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,1,power_law_1.2,0.46790399551391604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,1,power_law_1.01,0.48874878883361816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,1,power_law_1.2,0.48510079383850097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,1,power_law_1.01,0.4973504066467285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,1,power_law_1.2,0.48917760848999026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,1,power_law_1.01,0.5219200134277344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,1,power_law_1.2,0.5289023876190185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,1,power_law_1.01,0.559603214263916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,1,power_law_1.2,0.5707071781158447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,1,power_law_1.01,0.5784448146820068
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,1,power_law_1.2,0.6010240077972412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,1,power_law_1.01,0.6190080165863037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,1,power_law_1.2,0.6083903789520264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,1,power_law_1.01,0.7199679851531983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,1,power_law_1.2,0.7212351799011231
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,1,power_law_1.01,0.8567680358886719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,1,power_law_1.2,0.8793600082397461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,1,power_law_1.01,1.1023167610168456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,1,power_law_1.2,1.1375871658325196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,1,power_law_1.01,1.3656959533691406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,1,power_law_1.2,1.3645055770874024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,1,power_law_1.01,1.9182336807250977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,1,power_law_1.2,1.936729621887207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,1,power_law_1.01,2.366969680786133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,1,power_law_1.2,2.3719167709350586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,1,power_law_1.01,3.3926017761230467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,1,power_law_1.2,3.52740478515625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,1,power_law_1.01,4.720307159423828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,1,power_law_1.2,4.805132675170898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,1,power_law_1.01,7.147609710693359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,1,power_law_1.2,7.202130889892578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,1,power_law_1.01,10.561228942871093
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,1,power_law_1.2,10.723270416259766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,1,power_law_1.01,14.212191772460937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,1,power_law_1.2,14.468666076660156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,1,power_law_1.01,23.026527404785156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,1,power_law_1.2,25.292466735839845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,1,power_law_1.01,50.20004577636719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,1,power_law_1.2,50.05072021484375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,1,power_law_1.2,0.21512320041656494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,1,power_law_1.2,0.3302144050598145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,1,power_law_1.2,0.39443199634552
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,1,power_law_1.2,0.7281472206115722
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,1,power_law_1.2,0.7175039768218994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,1,power_law_1.2,0.735097599029541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,1,power_law_1.2,0.7392127990722657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,1,power_law_1.2,0.7457664012908936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,1,power_law_1.2,0.7486207962036133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,1,power_law_1.2,0.767411184310913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,1,power_law_1.2,0.79203200340271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,1,power_law_1.2,0.8516096115112305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,1,power_law_1.2,0.8432255744934082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,1,power_law_1.01,0.214355206489563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,1,power_law_1.2,0.8383296012878418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,1,power_law_1.01,0.3280191898345947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,1,power_law_1.2,0.9054976463317871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,1,power_law_1.01,0.4334400177001953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,1,power_law_1.2,0.9497280120849609
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,1,power_law_1.01,0.7224703788757324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,1,power_law_1.2,1.0017663955688476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,1,power_law_1.01,0.7208255767822266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,1,power_law_1.2,1.2034879684448243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,1,power_law_1.01,0.7413119792938232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,1,power_law_1.2,1.4541695594787598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,1,power_law_1.01,0.7277823925018311
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,1,power_law_1.2,1.7714048385620118
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,1,power_law_1.01,0.7523647785186768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,1,power_law_1.2,2.1844480514526365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,1,power_law_1.01,0.7650623798370362
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,1,power_law_1.2,3.035622406005859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,1,power_law_1.01,0.7711999893188477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,1,power_law_1.2,3.82174072265625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,1,power_law_1.01,0.7830912113189697
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,1,power_law_1.2,5.543199920654297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,1,power_law_1.01,0.8092864036560059
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,1,power_law_1.01,0.8440383911132813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,1,power_law_1.2,9.218323516845704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,1,power_law_1.01,0.8617280006408692
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,1,power_law_1.01,0.8924544334411622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,1,power_law_1.2,14.255609130859375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,1,power_law_1.01,0.9354559898376464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,1,power_law_1.01,1.024345588684082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,1,power_law_1.2,17.186508178710938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,1,power_law_1.01,1.2457152366638184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,1,power_law_1.01,1.400556755065918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,1,power_law_1.2,24.0661376953125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,1,power_law_1.01,1.8230592727661132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,1,power_law_1.01,2.234502410888672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,1,power_law_1.2,35.43971252441406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,1,power_law_1.01,3.052787208557129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,1,power_law_1.01,4.200377655029297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,1,power_law_1.01,6.092108917236328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,1,power_law_1.01,9.377721405029297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,1,power_law_1.2,76.241943359375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,1,power_law_1.01,14.753861999511718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,1,power_law_1.01,20.84093475341797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,1,power_law_1.01,24.881170654296874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,1,power_law_1.01,41.99290161132812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,1,power_law_1.01,82.200439453125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,1,power_law_1.01,0.16680320501327514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,1,power_law_1.2,0.16520960330963136
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,1,power_law_1.01,0.2673408031463623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,1,power_law_1.2,0.253875207901001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,1,power_law_1.01,0.2794431924819946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,1,power_law_1.2,0.30342400074005127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,1,power_law_1.01,0.6654911994934082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,1,power_law_1.2,0.5903744220733642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,1,power_law_1.01,1.0226240158081055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,1,power_law_1.2,0.8486207962036133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,1,power_law_1.01,1.4908224105834962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,1,power_law_1.2,1.23057279586792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,1,power_law_1.01,2.1005184173583986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,1,power_law_1.2,2.0194623947143553
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,1,power_law_1.01,2.2606719970703124
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,1,power_law_1.2,2.1923263549804686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,1,power_law_1.01,2.3313343048095705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,1,power_law_1.2,2.3333503723144533
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,1,power_law_1.01,2.4152959823608398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,1,power_law_1.2,2.3940479278564455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,1,power_law_1.01,2.481983947753906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,1,power_law_1.2,2.4476991653442384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,1,power_law_1.2,2.616044807434082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,1,power_law_1.2,2.695110321044922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,1,power_law_1.2,2.7497663497924805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,1,power_law_1.2,2.8878080368041994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,1,power_law_1.2,2.9431167602539063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,1,power_law_1.2,3.077465629577637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,1,power_law_1.2,3.319744110107422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,1,power_law_1.2,3.4606464385986326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,1,power_law_1.2,3.847507095336914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,1,power_law_1.2,3.9359809875488283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,1,power_law_1.2,4.5176128387451175
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,1,power_law_1.2,5.650969696044922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,1,power_law_1.2,7.047711944580078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,1,power_law_1.2,8.449638366699219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,1,power_law_1.2,11.854271697998048
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,1,power_law_1.2,14.939289855957032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,1,power_law_1.2,18.772454833984376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,1,power_law_1.2,32.19484252929688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,1,power_law_1.2,60.86097412109375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,1,power_law_1.01,0.07626240253448487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,1,power_law_1.01,0.09755520224571228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,1,power_law_1.01,0.16064640283584594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,1,power_law_1.01,0.2589440107345581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,1,power_law_1.01,0.35192320346832273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,1,power_law_1.01,0.5825407981872559
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,1,power_law_1.01,0.6103936195373535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,1,power_law_1.01,0.6320767879486084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,1,power_law_1.01,0.6658815860748291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,1,power_law_1.01,0.6675136089324951
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,1,power_law_1.01,0.6732607841491699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,1,power_law_1.01,0.6982463836669922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,1,power_law_1.01,0.7093120098114014
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,1,power_law_1.01,0.7199552059173584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,1,power_law_1.2,0.07939199805259704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,1,power_law_1.01,0.7596799850463867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,1,power_law_1.2,0.09333119988441467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,1,power_law_1.01,0.7666560173034668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,1,power_law_1.2,0.1568127989768982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,1,power_law_1.2,0.22889599800109864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,1,power_law_1.01,0.8002431869506836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,1,power_law_1.2,0.289516806602478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,1,power_law_1.01,0.8649408340454101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,1,power_law_1.2,0.5727615833282471
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,1,power_law_1.01,0.8993599891662598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,1,power_law_1.2,0.6495552062988281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,1,power_law_1.01,1.0152704238891601
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,1,power_law_1.2,0.6647103786468506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,1,power_law_1.01,1.157094383239746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,1,power_law_1.2,0.6790463924407959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,1,power_law_1.01,1.4078911781311034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,1,power_law_1.2,0.7003456115722656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,1,power_law_1.01,1.6968767166137695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,1,power_law_1.2,0.6995264053344726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,1,power_law_1.01,2.1844736099243165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,1,power_law_1.2,0.708128023147583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,1,power_law_1.01,2.6626560211181642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,1,power_law_1.2,0.7126272201538086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,1,power_law_1.01,3.731129455566406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,1,power_law_1.2,0.7326911926269531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,1,power_law_1.01,4.813286590576172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,1,power_law_1.2,0.7675072193145752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,1,power_law_1.2,0.7769216060638428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,1,power_law_1.01,5.820896148681641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,1,power_law_1.2,0.8101056098937989
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,1,power_law_1.01,11.581311798095703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,1,power_law_1.2,0.8854911804199219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,1,power_law_1.2,0.9125120162963867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,1,power_law_1.2,1.0508928298950195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,1,power_law_1.01,21.05885467529297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,1,power_law_1.2,1.1555456161499023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,1,power_law_1.2,1.434483242034912
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,1,power_law_1.2,1.743187141418457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,1,power_law_1.2,2.27710075378418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,1,power_law_1.2,2.758310317993164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,1,power_law_1.2,3.852422332763672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,1,power_law_1.2,5.6814208984375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,1,power_law_1.2,7.065593719482422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,1,power_law_1.2,11.831999969482421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,1,power_law_1.2,23.190150451660156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,1,power_law_1.01,2.5483455657958984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,1,power_law_1.01,2.679903984069824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,1,power_law_1.01,2.7192256927490233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,1,power_law_1.01,2.8099456787109376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,1,power_law_1.01,2.844358444213867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,1,power_law_1.01,2.9934528350830076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,1,power_law_1.01,3.1441856384277345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,1,power_law_1.01,3.2840641021728514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,1,power_law_1.01,3.610310363769531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,1,power_law_1.01,3.6877246856689454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,1,power_law_1.01,4.215903854370117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,1,power_law_1.01,4.742438507080078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,1,power_law_1.01,5.993568038940429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,1,power_law_1.01,8.048102569580077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,1,power_law_1.01,10.6259521484375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,1,power_law_1.01,14.276019287109374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,1,power_law_1.01,18.442477416992187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,1,power_law_1.01,29.772293090820312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,1,power_law_1.01,57.68589477539062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,1,power_law_1.01,0.17278079986572265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,1,power_law_1.01,0.26065280437469485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,1,power_law_1.01,0.3654975891113281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,1,power_law_1.01,0.6096127986907959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,1,power_law_1.01,0.9002240180969239
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,1,power_law_1.01,1.6641408920288085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,1,power_law_1.01,1.7190143585205078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,1,power_law_1.01,1.8332992553710938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,1,power_law_1.01,1.8214208602905273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,1,power_law_1.01,1.871379280090332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,1,power_law_1.01,1.9550975799560546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,1,power_law_1.01,2.0247871398925783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,1,power_law_1.01,2.0152896881103515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,1,power_law_1.01,2.0661504745483397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,1,power_law_1.01,2.1546304702758787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,1,power_law_1.01,2.179622459411621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,1,power_law_1.01,2.2566272735595705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,1,power_law_1.01,2.470649528503418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,1,power_law_1.01,2.56115837097168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,1,power_law_1.01,2.989401626586914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,1,power_law_1.01,3.018476867675781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,1,power_law_1.01,3.615264129638672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,1,power_law_1.01,5.427347183227539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,1,power_law_1.01,6.700166320800781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,1,power_law_1.01,8.659910583496094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,1,power_law_1.01,11.513177490234375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,1,power_law_1.01,14.836402893066406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,1,power_law_1.01,19.519430541992186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,1,power_law_1.2,0.17128959894180298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,1,power_law_1.01,32.07466125488281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,1,power_law_1.2,0.19585280418395995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,1,power_law_1.2,0.36789760589599607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,1,power_law_1.2,0.5857471942901611
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,1,power_law_1.2,0.8301376342773438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,1,power_law_1.01,63.72379150390625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,1,power_law_1.2,1.6087871551513673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,1,power_law_1.2,1.6665279388427734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,1,power_law_1.2,1.8184959411621093
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,1,power_law_1.2,1.9112831115722657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,1,power_law_1.2,1.939936065673828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,1,power_law_1.2,2.0276031494140625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,1,power_law_1.2,2.087001609802246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,1,power_law_1.2,2.1060352325439453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,1,power_law_1.2,2.140243148803711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,1,power_law_1.2,2.208639907836914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,1,power_law_1.2,2.2426496505737306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,1,power_law_1.2,2.348512077331543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,1,power_law_1.2,2.601657676696777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,1,power_law_1.2,2.6897216796875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,1,power_law_1.2,3.077401542663574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,1,power_law_1.2,3.4687744140625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,1,power_law_1.2,4.147488021850586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,1,power_law_1.2,4.440550231933594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,1,power_law_1.2,5.598899078369141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,1,power_law_1.2,8.796646118164062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,1,power_law_1.2,11.669798278808594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,1,power_law_1.2,16.11656951904297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,1,power_law_1.2,19.36781463623047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,1,power_law_1.01,0.16581120491027831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,1,power_law_1.01,0.2694528102874756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,1,power_law_1.2,32.6026123046875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,1,power_law_1.01,0.45479679107666016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,1,power_law_1.01,0.569484806060791
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,1,power_law_1.01,1.1474111557006836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,1,power_law_1.2,58.707635498046876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,1,power_law_1.01,1.7558208465576173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,1,power_law_1.01,2.1047935485839844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,1,power_law_1.01,2.8398975372314452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,1,power_law_1.01,3.00775032043457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,1,power_law_1.01,3.1212928771972654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,1,power_law_1.01,3.2947521209716797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,1,power_law_1.01,3.4499969482421875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,1,power_law_1.01,3.4819393157958984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,1,power_law_1.01,3.7430591583251953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,1,power_law_1.01,3.701689529418945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,1,power_law_1.01,3.84832649230957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,1,power_law_1.01,4.000831985473633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,1,power_law_1.01,4.225715255737304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,1,power_law_1.01,4.358892822265625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,1,power_law_1.01,4.662118530273437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,1,power_law_1.01,4.97534065246582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,1,power_law_1.01,5.835161590576172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,1,power_law_1.01,6.592031860351563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,1,power_law_1.01,7.902130889892578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,1,power_law_1.01,10.664883422851563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,1,power_law_1.01,13.842918395996094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,1,power_law_1.01,16.310322570800782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,1,power_law_1.01,19.827622985839845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,1,power_law_1.01,31.60751953125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,1,power_law_1.01,55.818389892578125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,1,power_law_1.2,0.1688447952270508
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,1,power_law_1.2,0.26633601188659667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,1,power_law_1.2,0.3484544038772583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,1,power_law_1.2,0.5706624031066895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,1,power_law_1.2,1.0537856101989747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,1,power_law_1.2,1.5158207893371582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,1,power_law_1.2,1.8598848342895509
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,1,power_law_1.2,2.724563217163086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,1,power_law_1.2,2.801350402832031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,1,power_law_1.2,2.9590463638305664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,1,power_law_1.2,3.1660991668701173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,1,power_law_1.2,3.294713592529297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,1,power_law_1.2,3.3934207916259767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,1,power_law_1.2,3.516307067871094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,1,power_law_1.2,3.7761920928955077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,1,power_law_1.2,3.813875198364258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,1,power_law_1.2,4.013145446777344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,1,power_law_1.2,4.228524780273437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,1,power_law_1.2,4.635871887207031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,1,power_law_1.2,4.9851329803466795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,1,power_law_1.2,5.3395648956298825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,1,power_law_1.2,6.182112121582032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,1,power_law_1.2,7.0165245056152346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,1,power_law_1.2,8.479417419433593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,1,power_law_1.2,11.394271850585938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,1,power_law_1.2,14.193760681152344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,1,power_law_1.2,17.93640899658203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,1,power_law_1.2,21.3815673828125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,1,power_law_1.2,31.80894775390625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,1,power_law_1.01,0.09249920248985291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,1,power_law_1.01,0.11360000371932984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,1,power_law_1.01,0.13674880266189576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,1,power_law_1.01,0.23832321166992188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,1,power_law_1.01,0.24078719615936278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,1,power_law_1.2,68.32625732421874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,1,power_law_1.01,0.24119040966033936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,1,power_law_1.01,0.24036478996276855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,1,power_law_1.01,0.24609920978546143
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,1,power_law_1.01,0.25859200954437256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,1,power_law_1.01,0.26739840507507323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,1,power_law_1.01,0.2561471939086914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,1,power_law_1.01,0.2731328010559082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,1,power_law_1.01,0.26924800872802734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,1,power_law_1.01,0.28972160816192627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,1,power_law_1.01,0.3169663906097412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,1,power_law_1.01,0.3272063970565796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,1,power_law_1.01,0.3525952100753784
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,1,power_law_1.01,0.4101439952850342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,1,power_law_1.01,0.48877439498901365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,1,power_law_1.01,0.6255871772766113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,1,power_law_1.01,0.7716159820556641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,1,power_law_1.01,1.0288384437561036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,1,power_law_1.01,1.2809599876403808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,1,power_law_1.01,1.8345279693603516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,1,power_law_1.01,2.3571712493896486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,1,power_law_1.01,3.485561752319336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,1,power_law_1.01,5.032691192626953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,1,power_law_1.01,6.604319763183594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,1,power_law_1.01,10.733510589599609
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,1,power_law_1.01,22.627833557128906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,1,power_law_1.2,0.09265279769897461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,1,power_law_1.2,0.11312639713287354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,1,power_law_1.2,0.14179840087890624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,1,power_law_1.2,0.23559679985046386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,1,power_law_1.2,0.2355583906173706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,1,power_law_1.2,0.24378879070281984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,1,power_law_1.2,0.2446079969406128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,1,power_law_1.2,0.24973440170288086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,1,power_law_1.2,0.2534143924713135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,1,power_law_1.2,0.26056320667266847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,1,power_law_1.2,0.2618112087249756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,1,power_law_1.2,0.26898560523986814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,1,power_law_1.2,0.2692032098770142
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,1,power_law_1.2,0.27984640598297117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,1,power_law_1.2,0.31833600997924805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,1,power_law_1.2,0.3294015884399414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,1,power_law_1.2,0.34065918922424315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,1,power_law_1.2,0.4131648063659668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,1,power_law_1.2,0.4694784164428711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,1,power_law_1.2,0.6251264095306397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,1,power_law_1.2,0.7388031959533692
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,1,power_law_1.2,1.0140480041503905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,1,power_law_1.2,1.2186367988586426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,1,power_law_1.2,1.759110450744629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,1,power_law_1.2,2.306540870666504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,1,power_law_1.2,3.354899215698242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,1,power_law_1.2,4.954803085327148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,1,power_law_1.2,6.317343902587891
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,1,power_law_1.2,10.631180572509766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,1,power_law_1.2,24.338259887695312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,1,power_law_1.01,0.13181439638137818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,1,power_law_1.01,0.1791424036026001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,1,power_law_1.01,0.22807679176330567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,1,power_law_1.01,0.37239038944244385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,1,power_law_1.01,0.37881600856781006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,1,power_law_1.01,0.3835200071334839
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,1,power_law_1.01,0.3874111890792847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,1,power_law_1.01,0.3915071964263916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,1,power_law_1.01,0.39335041046142577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,1,power_law_1.01,0.399833607673645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,1,power_law_1.01,0.40215678215026857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,1,power_law_1.01,0.40645761489868165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,1,power_law_1.01,0.41854081153869627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,1,power_law_1.01,0.43799681663513185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,1,power_law_1.01,0.47896318435668944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,1,power_law_1.01,0.5128896236419678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,1,power_law_1.01,0.5522175788879394
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,1,power_law_1.01,0.6671679973602295
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,1,power_law_1.01,0.7929088115692139
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,1,power_law_1.01,0.995257568359375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,1,power_law_1.01,1.2002623558044434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,1,power_law_1.01,1.5998335838317872
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,1,power_law_1.01,2.0030784606933594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,1,power_law_1.01,2.84466552734375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,1,power_law_1.01,3.923276901245117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,1,power_law_1.01,5.879321670532226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,1,power_law_1.01,8.191244506835938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,1,power_law_1.01,10.506739044189453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,1,power_law_1.01,19.269151306152345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,1,power_law_1.01,0.11256959438323974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,1,power_law_1.01,40.0599609375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,1,power_law_1.01,0.16560640335083007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,1,power_law_1.01,0.18423680067062378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,1,power_law_1.01,0.3323199987411499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,1,power_law_1.01,0.5899648189544677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,1,power_law_1.01,0.7687488079071045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,1,power_law_1.01,1.0790207862854004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,1,power_law_1.01,1.165452766418457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,1,power_law_1.01,1.219923210144043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,1,power_law_1.01,1.2752191543579101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,1,power_law_1.01,1.3239616394042968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,1,power_law_1.01,1.3469120025634767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,1,power_law_1.01,1.3804863929748534
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,1,power_law_1.01,1.4276032447814941
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,1,power_law_1.01,1.4443903923034669
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,1,power_law_1.01,1.4982591629028321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,1,power_law_1.01,1.5506752014160157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,1,power_law_1.01,1.67761287689209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,1,power_law_1.01,1.7608064651489257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,1,power_law_1.01,1.9555648803710937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,1,power_law_1.01,2.0338111877441407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,1,power_law_1.01,2.436639976501465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,1,power_law_1.01,2.768627166748047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,1,power_law_1.01,3.4396800994873047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,1,power_law_1.01,4.556864166259766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,1,power_law_1.01,5.979679870605469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,1,power_law_1.01,7.479641723632812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,1,power_law_1.01,9.095916748046875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,1,power_law_1.2,0.11374080181121826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,1,power_law_1.2,0.16391680240631104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,1,power_law_1.01,14.133932495117188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,1,power_law_1.2,0.2003711938858032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,1,power_law_1.2,0.32756481170654295
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,1,power_law_1.01,28.688314819335936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,1,power_law_1.2,0.5182208061218262
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,1,power_law_1.2,0.6809599876403809
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,1,power_law_1.2,1.0912575721740723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,1,power_law_1.2,1.121548843383789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,1,power_law_1.2,1.1997952461242676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,1,power_law_1.2,1.2374784469604492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,1,power_law_1.2,1.3270976066589355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,1,power_law_1.2,1.3714176177978517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,1,power_law_1.2,1.3562687873840331
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,1,power_law_1.2,1.436953639984131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,1,power_law_1.2,1.5211392402648927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,1,power_law_1.2,1.5670016288757325
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,1,power_law_1.2,1.654630470275879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,1,power_law_1.2,0.13014400005340576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,1,power_law_1.2,1.7832704544067384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,1,power_law_1.2,0.16147840023040771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,1,power_law_1.2,0.1893056035041809
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,1,power_law_1.2,1.8606719970703125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,1,power_law_1.2,0.3666815996170044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,1,power_law_1.2,2.0615936279296876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,1,power_law_1.2,0.38255360126495364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,1,power_law_1.2,0.379801607131958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,1,power_law_1.2,2.172185516357422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,1,power_law_1.2,0.38102400302886963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,1,power_law_1.2,0.39495038986206055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,1,power_law_1.2,2.4959808349609376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,1,power_law_1.2,0.40970239639282224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,1,power_law_1.2,2.8762752532958986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,1,power_law_1.2,0.41726078987121584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,1,power_law_1.2,0.40453758239746096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,1,power_law_1.2,3.5121791839599608
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,1,power_law_1.2,0.41870718002319335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,1,power_law_1.2,4.667462539672852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,1,power_law_1.2,0.4228096008300781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,1,power_law_1.2,0.4494272232055664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,1,power_law_1.2,6.142444610595703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,1,power_law_1.2,0.4989823818206787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,1,power_law_1.2,0.5194496154785156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,1,power_law_1.2,7.721234893798828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,1,power_law_1.2,0.5419775962829589
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,1,power_law_1.2,0.6507455825805664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,1,power_law_1.2,9.3608642578125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,1,power_law_1.2,0.7437183856964111
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,1,power_law_1.2,0.964083194732666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,1,power_law_1.2,15.035264587402343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,1,power_law_1.2,1.163360023498535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,1,power_law_1.2,1.6358272552490234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,1,power_law_1.2,2.0177791595458983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,1,power_law_1.2,2.854591941833496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,1,power_law_1.2,32.25118713378906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,1,power_law_1.2,3.7269630432128906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,1,power_law_1.2,5.549280166625977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,1,power_law_1.2,8.002777862548829
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,1,power_law_1.2,10.515277099609374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,1,power_law_1.01,0.06340479850769043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,1,power_law_1.2,18.845791625976563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,1,power_law_1.01,0.06546559929847717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,1,power_law_1.01,0.1090880036354065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,1,power_law_1.01,0.1572224020957947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,1,power_law_1.2,37.451864624023436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,1,power_law_1.01,0.2055488109588623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,1,power_law_1.01,0.3196223974227905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,1,power_law_1.01,0.34276480674743653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,1,power_law_1.01,0.3464384078979492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,1,power_law_1.01,0.3614016056060791
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,1,power_law_1.01,0.3721024036407471
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,1,power_law_1.01,0.3779776096343994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,1,power_law_1.01,0.39089920520782473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,1,power_law_1.01,0.38331520557403564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,1,power_law_1.01,0.3996031999588013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,1,power_law_1.01,0.4162879943847656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,1,power_law_1.01,0.43349761962890626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,1,power_law_1.01,0.4445184230804443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,1,power_law_1.01,0.4977280139923096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,1,power_law_1.01,0.5276991844177246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,1,power_law_1.01,0.6152512073516846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,1,power_law_1.01,0.691264009475708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,1,power_law_1.01,0.874835205078125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,1,power_law_1.01,1.0378560066223144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,1,power_law_1.01,1.3730560302734376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,1,power_law_1.01,1.6856319427490234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,1,power_law_1.01,2.345305633544922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,1,power_law_1.01,2.982028770446777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,1,power_law_1.01,3.6590206146240236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,1,power_law_1.01,5.69944953918457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,1,power_law_1.01,13.20642547607422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,1,power_law_1.2,0.0630079984664917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,1,power_law_1.2,0.06956160068511963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,1,power_law_1.2,0.1011072039604187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,1,power_law_1.2,0.13511040210723876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,1,power_law_1.2,0.1789247989654541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,1,power_law_1.2,0.3153215885162354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,1,power_law_1.2,0.355679988861084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,1,power_law_1.2,0.3538304090499878
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,1,power_law_1.2,0.3732800006866455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,1,power_law_1.2,0.3759552001953125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,1,power_law_1.2,0.3847552061080933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,1,power_law_1.2,0.3951936006546021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,1,power_law_1.2,0.4081024169921875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,1,power_law_1.2,0.41895041465759275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,1,power_law_1.2,0.4265279769897461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,1,power_law_1.2,0.4445504188537598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,1,power_law_1.2,0.4564352035522461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,1,power_law_1.2,0.5162303924560547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,1,power_law_1.2,0.5387263774871827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,1,power_law_1.2,0.6288703918457031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,1,power_law_1.2,0.7249216079711914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,1,power_law_1.2,0.8863039970397949
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,1,power_law_1.2,1.0667327880859374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,1,power_law_1.2,1.3944128036499024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,1,power_law_1.2,1.7136959075927733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,1,power_law_1.2,2.369068717956543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,1,power_law_1.2,3.057369613647461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,1,power_law_1.2,3.809414291381836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,1,power_law_1.2,6.0119678497314455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,1,power_law_1.2,12.989369201660157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,1,power_law_1.01,0.1131327986717224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,1,power_law_1.01,0.15122560262680054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,1,power_law_1.01,0.21758079528808594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,1,power_law_1.01,0.3535615921020508
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,1,power_law_1.01,0.495692777633667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,1,power_law_1.01,0.8223487854003906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,1,power_law_1.01,0.8919872283935547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,1,power_law_1.01,0.9345791816711426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,1,power_law_1.01,0.9602432250976562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,1,power_law_1.01,0.9853695869445801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,1,power_law_1.2,0.11806080341339112
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,1,power_law_1.01,1.0288000106811523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,1,power_law_1.2,0.12112640142440796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,1,power_law_1.01,1.0229632377624511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,1,power_law_1.2,0.21001598834991456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,1,power_law_1.01,1.0736448287963867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,1,power_law_1.2,0.3109823942184448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,1,power_law_1.01,1.0793727874755858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,1,power_law_1.2,0.4494272232055664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,1,power_law_1.01,1.123200035095215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,1,power_law_1.2,0.8272640228271484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,1,power_law_1.01,1.14900484085083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,1,power_law_1.2,0.8841983795166015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,1,power_law_1.01,1.1776767730712892
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,1,power_law_1.2,0.9489343643188477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,1,power_law_1.01,1.2804927825927734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,1,power_law_1.2,0.9825216293334961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,1,power_law_1.01,1.3820672035217285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,1,power_law_1.2,0.9976767539978028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,1,power_law_1.01,1.5686400413513184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,1,power_law_1.2,1.0492671966552733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,1,power_law_1.01,1.653830337524414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,1,power_law_1.2,1.0806015968322753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,1,power_law_1.01,1.9641088485717773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,1,power_law_1.2,1.1088640213012695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,1,power_law_1.01,2.3771839141845703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,1,power_law_1.2,1.105183982849121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,1,power_law_1.01,3.0138431549072267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,1,power_law_1.2,1.1580160140991211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,1,power_law_1.01,4.305984115600586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,1,power_law_1.2,1.1739968299865722
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,1,power_law_1.01,5.722803115844727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,1,power_law_1.2,1.2170047760009766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,1,power_law_1.01,6.907769775390625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,1,power_law_1.2,1.3144895553588867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,1,power_law_1.2,1.4168319702148438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,1,power_law_1.01,8.52323226928711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,1,power_law_1.2,1.6145151138305665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,1,power_law_1.2,1.6877759933471679
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,1,power_law_1.01,14.359417724609376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,1,power_law_1.2,2.021452713012695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,1,power_law_1.2,3.0393280029296874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,1,power_law_1.01,30.56604919433594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,1,power_law_1.2,3.6848384857177736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,1,power_law_1.2,4.326822280883789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,1,power_law_1.2,5.745318222045898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,1,power_law_1.2,7.121715545654297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,1,power_law_1.2,8.78067855834961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,1,power_law_1.2,15.573426818847656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,1,power_law_1.2,27.195864868164062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,1,1,power_law_1.01,0.04840959906578064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,1,1,power_law_1.01,0.059059202671051025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,1,1,power_law_1.01,0.07587839961051941
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,1,1,power_law_1.01,0.12334719896316529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,1,1,power_law_1.01,0.12787840366363526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,1,1,power_law_1.01,0.15000319480895996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,1,1,power_law_1.01,0.15204479694366455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,1,1,power_law_1.01,0.15818239450454713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,1,power_law_1.01,0.11318399906158447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,1,1,power_law_1.01,0.1534783959388733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,1,1,power_law_1.01,0.15408639907836913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,1,power_law_1.01,0.16663680076599122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,1,1,power_law_1.01,0.16205439567565919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,1,power_law_1.01,0.26472959518432615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,1,1,power_law_1.01,0.18910720348358154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,1,1,power_law_1.01,0.20119040012359618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,1,1,power_law_1.2,0.0486272007226944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,1,power_law_1.01,0.3345599889755249
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,1,1,power_law_1.01,0.222707200050354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,1,1,power_law_1.2,0.0590719997882843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,1,power_law_1.01,0.6556992053985595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,1,1,power_law_1.01,0.2556735992431641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,1,1,power_law_1.2,0.07136639952659607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,1,1,power_law_1.01,0.28188159465789797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,1,1,power_law_1.2,0.12378879785537719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,1,power_law_1.01,0.9342144012451172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,1,1,power_law_1.2,0.13401600122451782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,1,1,power_law_1.01,0.3345151901245117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,1,power_law_1.01,1.13307523727417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,1,1,power_law_1.2,0.15082240104675293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,1,1,power_law_1.01,0.44654078483581544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,1,1,power_law_1.2,0.1524672031402588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,1,1,power_law_1.01,0.5407487869262695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,1,power_law_1.01,1.5047871589660644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,1,1,power_law_1.2,0.156550395488739
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,1,1,power_law_1.01,0.7777152061462402
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,1,power_law_1.01,1.5625408172607422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,1,1,power_law_1.2,0.15408639907836913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,1,1,power_law_1.01,0.9968447685241699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,1,1,power_law_1.2,0.15676800012588502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,1,1,power_law_1.01,1.4406399726867676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,1,power_law_1.01,1.6206911087036133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,1,1,power_law_1.2,0.1641343951225281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,1,1,power_law_1.01,1.889369583129883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,1,1,power_law_1.2,0.20018560886383058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,1,power_law_1.01,1.718604850769043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,1,1,power_law_1.01,2.7820863723754883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,1,1,power_law_1.2,0.20364160537719728
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,1,power_law_1.01,1.7874176025390625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,1,1,power_law_1.01,3.6897537231445314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,1,1,power_law_1.2,0.22495999336242675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,1,1,power_law_1.2,0.25527679920196533
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,1,1,power_law_1.01,5.469049453735352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,1,power_law_1.01,1.839846420288086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,1,1,power_law_1.2,0.27903358936309813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,1,1,power_law_1.01,7.2704833984375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,1,1,power_law_1.2,0.33596799373626707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,1,power_law_1.01,1.8844863891601562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,1,1,power_law_1.2,0.4465536117553711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,1,1,power_law_1.01,9.065126037597656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,1,power_law_1.01,1.9567808151245116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,1,1,power_law_1.2,0.5465023994445801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,1,1,power_law_1.2,0.7785408020019531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,1,1,power_law_1.01,14.457933044433593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,1,power_law_1.01,2.042393684387207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,1,1,power_law_1.2,0.9968192100524902
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,1,power_law_1.01,2.0931840896606446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,1,1,power_law_1.2,1.4512895584106444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,1,1,power_law_1.01,28.809707641601562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,1,1,power_law_1.2,1.8909952163696289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,1,power_law_1.01,2.220569610595703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,1,1,power_law_1.2,2.789049530029297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,1,power_law_1.01,2.30371208190918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,1,1,power_law_1.2,3.6806846618652345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,1,1,power_law_1.2,5.486687850952149
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,1,power_law_1.01,2.550092887878418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,1,1,power_law_1.2,7.282771301269531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,1,power_law_1.01,2.7319616317749023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,1,1,power_law_1.2,9.074150085449219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,1,power_law_1.01,3.1845632553100587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,1,power_law_1.2,0.11297919750213622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,1,1,power_law_1.2,14.441958618164062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,1,power_law_1.01,3.4655487060546877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,1,power_law_1.2,0.16663680076599122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,1,power_law_1.01,4.271641540527344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,1,power_law_1.2,0.19612799882888793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,1,1,power_law_1.2,28.821978759765624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,1,power_law_1.2,0.33089919090270997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,1,power_law_1.01,5.91038703918457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,1,power_law_1.2,0.5559679985046386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,1,power_law_1.01,7.331552124023437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,1,power_law_1.2,0.7970047950744629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,1,power_law_1.01,8.766770935058593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,1,power_law_1.2,1.0194175720214844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,1,power_law_1.2,1.434547233581543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,1,1,power_law_1.01,0.07790079712867737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,1,power_law_1.01,10.453523254394531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,1,1,power_law_1.01,0.09716479778289795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,1,power_law_1.2,1.5052032470703125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,1,1,power_law_1.01,0.10311039686203002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,1,power_law_1.01,15.078944396972656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,1,power_law_1.2,1.5494336128234862
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,1,1,power_law_1.01,0.169868803024292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,1,1,power_law_1.01,0.16925439834594727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,1,power_law_1.2,1.663724708557129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,1,1,power_law_1.01,0.17088639736175537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,1,1,power_law_1.01,0.17169920206069947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,1,power_law_1.2,1.7329408645629882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,1,power_law_1.01,33.395416259765625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,1,1,power_law_1.01,0.1700543999671936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,1,power_law_1.2,1.7882368087768554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,1,1,power_law_1.01,0.1717120051383972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,1,1,power_law_1.01,0.17742079496383667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,1,power_law_1.2,1.9100992202758789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,1,1,power_law_1.01,0.17989120483398438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,1,power_law_1.2,1.9768640518188476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,1,1,power_law_1.2,0.07831040024757385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,1,1,power_law_1.01,0.19034240245819092
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,1,1,power_law_1.2,0.08895999789237977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,1,1,power_law_1.01,0.19362560510635377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,1,power_law_1.2,1.9809471130371095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,1,1,power_law_1.2,0.11847039461135864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,1,1,power_law_1.01,0.19649280309677125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,1,1,power_law_1.2,0.16639360189437866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,1,power_law_1.2,2.116134452819824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,1,1,power_law_1.01,0.22351999282836915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,1,1,power_law_1.2,0.1676095962524414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,1,1,power_law_1.01,0.22844159603118896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,1,power_law_1.2,2.2828351974487306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,1,1,power_law_1.2,0.17169920206069947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,1,1,power_law_1.01,0.24562559127807618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,1,1,power_law_1.2,0.17171839475631714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,1,power_law_1.2,2.4247488021850585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,1,1,power_law_1.01,0.2935551881790161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,1,1,power_law_1.2,0.1725376009941101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,1,1,power_law_1.01,0.33452160358428956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,1,power_law_1.2,2.684441566467285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,1,1,power_law_1.2,0.17415679693222047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,1,1,power_law_1.01,0.4432640075683594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,1,1,power_law_1.2,0.18052480220794678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,1,power_law_1.2,2.869772720336914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,1,1,power_law_1.01,0.5202816009521485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,1,1,power_law_1.2,0.18338559865951537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,1,1,power_law_1.01,0.7003007888793945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,1,power_law_1.2,3.415584182739258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,1,1,power_law_1.2,0.1905408024787903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,1,1,power_law_1.01,0.8508159637451171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,1,1,power_law_1.01,0.06791679859161377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,1,1,power_law_1.2,0.19422719478607178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,1,power_law_1.2,3.735276794433594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,1,1,power_law_1.01,1.1957056045532226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,1,1,power_law_1.2,0.2053056001663208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,1,1,power_law_1.01,0.09658240079879761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,1,1,power_law_1.01,1.5452927589416503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,1,1,power_law_1.01,0.11994240283966065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,1,1,power_law_1.2,0.22394239902496338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,1,power_law_1.2,4.500812911987305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,1,1,power_law_1.01,2.2930368423461913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,1,1,power_law_1.2,0.22660479545593262
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,1,1,power_law_1.01,0.19510400295257568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,1,1,power_law_1.2,0.24298880100250245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,1,power_law_1.2,6.262911987304688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,1,1,power_law_1.01,0.21292800903320314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,1,1,power_law_1.01,3.0495487213134767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,1,1,power_law_1.2,0.29602560997009275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,1,1,power_law_1.01,0.2704576015472412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,1,1,power_law_1.01,3.899059295654297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,1,power_law_1.2,7.755289459228516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,1,1,power_law_1.2,0.3453759908676147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,1,1,power_law_1.01,0.2516223907470703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,1,1,power_law_1.01,6.253023910522461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,1,1,power_law_1.2,0.4358975887298584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,1,1,power_law_1.01,0.27948799133300783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,1,power_law_1.2,9.150387573242188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,1,1,power_law_1.2,0.5354432106018067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,1,1,power_law_1.01,0.24833281040191652
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,1,1,power_law_1.01,12.672473907470703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,1,1,power_law_1.2,0.708076810836792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,1,1,power_law_1.01,0.2544895887374878
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,1,power_law_1.2,10.989491271972657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,1,1,power_law_1.01,0.28358399868011475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,1,1,power_law_1.2,0.8558848381042481
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,1,1,power_law_1.01,0.3065023899078369
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,1,1,power_law_1.2,1.2243712425231934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,1,1,power_law_1.01,0.3128511905670166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,1,1,power_law_1.2,1.5698687553405761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,1,power_law_1.2,15.558380126953125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,1,1,power_law_1.01,0.3699712038040161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,1,1,power_law_1.2,2.297113609313965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,1,1,power_law_1.01,0.39539198875427245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,1,1,power_law_1.2,3.044223976135254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,1,1,power_law_1.01,0.45354881286621096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,1,1,power_law_1.2,3.9183040618896485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,1,power_law_1.2,33.63955078125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,1,1,power_law_1.01,0.5301439762115479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,1,1,power_law_1.01,0.7293568134307862
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,1,1,power_law_1.2,6.294745635986328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,1,1,power_law_1.01,0.9252032279968262
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,1,1,power_law_1.2,12.934835815429688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,1,1,power_law_1.01,1.2853631973266602
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,1,1,power_law_1.01,1.671436882019043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,1,1,power_law_1.01,2.4116416931152345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,1,1,power_law_1.01,3.1693248748779297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,1,1,power_law_1.01,4.685152053833008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,1,1,power_law_1.01,6.18139533996582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,1,1,power_law_1.2,0.06850559711456299
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,1,1,power_law_1.01,9.2052734375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,1,1,power_law_1.2,0.06971520185470581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,1,1,power_law_1.2,0.06951680183410644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,1,1,power_law_1.01,12.221778869628906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,1,1,power_law_1.2,0.06970880031585694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,1,1,power_law_1.2,0.10432640314102173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,1,1,power_law_1.01,15.246450805664063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,1,1,power_law_1.2,0.1608448028564453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,1,1,power_law_1.2,0.12744959592819213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,1,1,power_law_1.01,24.289202880859374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,1,1,power_law_1.2,0.16514559984207153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,1,1,power_law_1.2,0.12951040267944336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,1,1,power_law_1.2,0.13073279857635497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,1,1,power_law_1.01,48.40904846191406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,1,1,power_law_1.2,0.17043839693069457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,1,1,power_law_1.2,0.17640960216522217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,1,1,power_law_1.2,0.17825920581817628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,1,1,power_law_1.2,0.22863359451293946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,1,1,power_law_1.2,0.2767616033554077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,1,1,power_law_1.2,0.31875200271606446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,1,1,power_law_1.2,0.4203328132629395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,1,1,power_law_1.2,0.6030144214630127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,1,1,power_law_1.2,0.7969471931457519
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,1,1,power_law_1.01,0.10767999887466431
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,1,1,power_law_1.2,1.1735808372497558
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,1,1,power_law_1.01,0.13551360368728638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,1,1,power_law_1.2,1.5506175994873046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,1,1,power_law_1.01,0.1707327961921692
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,1,1,power_law_1.2,2.303660774230957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,1,1,power_law_1.2,0.10700160264968872
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,1,1,power_law_1.01,0.2456831932067871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,1,1,power_law_1.2,3.054047966003418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,1,1,power_law_1.2,0.14263039827346802
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,1,1,power_law_1.01,0.2551039934158325
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,1,1,power_law_1.2,0.15532159805297852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,1,1,power_law_1.2,4.572441482543946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,1,1,power_law_1.01,0.25614080429077146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,1,1,power_law_1.01,0.05194240212440491
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,1,1,power_law_1.2,0.24995200634002684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,1,1,power_law_1.01,0.25264639854431153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,1,1,power_law_1.2,6.082841491699218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,1,1,power_law_1.01,0.08595200181007386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,1,1,power_law_1.2,0.24728960990905763
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,1,1,power_law_1.01,0.25880959033966067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,1,1,power_law_1.2,9.107347106933593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,1,1,power_law_1.01,0.09373440146446228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,1,1,power_law_1.2,0.2540287971496582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,1,1,power_law_1.01,0.26104960441589353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,1,1,power_law_1.2,0.25771520137786863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,1,1,power_law_1.01,0.26083199977874755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,1,1,power_law_1.01,0.14369920492172242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,1,1,power_law_1.2,12.12833251953125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,1,1,power_law_1.2,0.2603967905044556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,1,1,power_law_1.01,0.26883199214935305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,1,1,power_law_1.01,0.347871994972229
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,1,1,power_law_1.2,0.26100480556488037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,1,1,power_law_1.2,15.157119750976562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,1,1,power_law_1.01,0.2755840063095093
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,1,1,power_law_1.2,0.26447999477386475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,1,1,power_law_1.01,0.4152512073516846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,1,1,power_law_1.01,0.2850239992141724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,1,1,power_law_1.2,0.26735999584198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,1,1,power_law_1.01,0.2931904077529907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,1,1,power_law_1.2,24.23588409423828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,1,1,power_law_1.01,0.5125440120697021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,1,1,power_law_1.2,0.28107519149780275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,1,1,power_law_1.01,0.3298559904098511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,1,1,power_law_1.01,0.5588160037994385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,1,1,power_law_1.2,0.2900799989700317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,1,1,power_law_1.01,0.34050559997558594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,1,1,power_law_1.2,0.29212799072265627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,1,1,power_law_1.01,0.5817728042602539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,1,1,power_law_1.01,0.3657088041305542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,1,1,power_law_1.2,48.435675048828124
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,1,1,power_law_1.2,0.32816638946533205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,1,1,power_law_1.01,0.44700160026550295
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,1,1,power_law_1.01,0.608787202835083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,1,1,power_law_1.2,0.3318527936935425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,1,1,power_law_1.01,0.5117184162139893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,1,1,power_law_1.01,0.6659327983856201
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,1,1,power_law_1.2,0.3662847995758057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,1,1,power_law_1.01,0.631712007522583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,1,1,power_law_1.2,0.434662389755249
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,1,1,power_law_1.01,0.713043212890625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,1,1,power_law_1.01,0.7523583889007568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,1,1,power_law_1.2,0.5145343780517578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,1,1,power_law_1.01,0.9952447891235352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,1,1,power_law_1.01,0.7580927848815918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,1,1,power_law_1.2,0.6359807968139648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,1,1,power_law_1.01,1.2313856124877929
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,1,1,power_law_1.01,0.8449215888977051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,1,1,power_law_1.2,0.7449344158172607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,1,1,power_law_1.01,1.7460479736328125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,1,1,power_law_1.01,0.7662784099578858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,1,1,power_law_1.2,0.9865983963012696
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,1,1,power_law_1.01,2.3053632736206056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,1,1,power_law_1.2,1.2174079895019532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,1,1,power_law_1.01,0.8428671836853028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,1,1,power_law_1.01,3.422547149658203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,1,1,power_law_1.2,1.7451711654663087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,1,1,power_law_1.01,0.9133248329162598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,1,1,power_law_1.01,4.502041625976562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,1,1,power_law_1.2,2.263942337036133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,1,1,power_law_1.01,0.8936767578125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,1,1,power_law_1.01,5.624351882934571
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,1,1,power_law_1.2,3.362278366088867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,1,1,power_law_1.2,0.052102398872375486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,1,1,power_law_1.01,0.9559295654296875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,1,1,power_law_1.01,9.337158203125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,1,1,power_law_1.2,4.549100875854492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,1,1,power_law_1.2,0.07994880080223084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,1,1,power_law_1.01,1.3297087669372558
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,1,1,power_law_1.2,5.832582473754883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,1,1,power_law_1.01,20.856959533691406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,1,1,power_law_1.2,0.08814719915390015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,1,1,power_law_1.01,1.5502528190612792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,1,1,power_law_1.2,9.278508758544922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,1,1,power_law_1.2,0.14832639694213867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,1,1,power_law_1.01,1.9936447143554688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,1,1,power_law_1.2,0.3058495998382568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,1,1,power_law_1.2,20.111634826660158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,1,1,power_law_1.01,2.4550655364990233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,1,1,power_law_1.2,0.34803199768066406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,1,1,power_law_1.01,3.341843032836914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,1,1,power_law_1.2,0.48545279502868655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,1,1,power_law_1.01,4.225350570678711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,1,1,power_law_1.2,0.53788161277771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,1,1,power_law_1.2,0.5702400207519531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,1,1,power_law_1.01,6.079967880249024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,1,1,power_law_1.2,0.5968704223632812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,1,1,power_law_1.01,7.870572662353515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,1,1,power_law_1.2,0.667526388168335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,1,1,power_law_1.2,0.7232384204864502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,1,1,power_law_1.01,9.668319702148438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,1,1,power_law_1.2,0.7801472187042237
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,1,1,power_law_1.01,15.10106201171875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,1,1,power_law_1.2,0.8407423973083497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,1,1,power_law_1.2,0.781388807296753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,1,1,power_law_1.2,0.8289024353027343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,1,1,power_law_1.01,29.564453125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,1,1,power_law_1.2,0.9145024299621582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,1,1,power_law_1.2,0.8751232147216796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,1,1,power_law_1.2,1.017728042602539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,1,1,power_law_1.2,1.3299903869628906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,1,1,power_law_1.2,1.5162176132202148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,1,1,power_law_1.01,0.02818560004234314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,1,1,power_law_1.2,2.0407039642333986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,1,1,power_law_1.01,0.11829760074615478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,1,1,power_law_1.01,0.03473919928073883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,1,1,power_law_1.2,2.451321601867676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,1,1,power_law_1.01,0.049491199851036075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,1,1,power_law_1.2,3.370470428466797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,1,1,power_law_1.01,0.07816960215568543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,1,1,power_law_1.2,0.12174719572067261
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,1,1,power_law_1.01,0.11521919965744018
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,1,1,power_law_1.2,4.2224384307861325
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,1,1,power_law_1.2,0.1618880033493042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,1,1,power_law_1.01,0.1678655982017517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,1,1,power_law_1.2,5.990694427490235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,1,1,power_law_1.2,0.1692415952682495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,1,1,power_law_1.01,0.18156800270080567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,1,1,power_law_1.01,0.1817919969558716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,1,1,power_law_1.2,0.2687936067581177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,1,1,power_law_1.2,7.8676605224609375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,1,1,power_law_1.01,0.1789247989654541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,1,1,power_law_1.2,0.36525440216064453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,1,1,power_law_1.2,9.685881805419921
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,1,1,power_law_1.01,0.18588800430297853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,1,1,power_law_1.2,0.5116864204406738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,1,1,power_law_1.01,0.20555520057678223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,1,1,power_law_1.2,0.7863039970397949
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,1,1,power_law_1.2,15.101823425292968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,1,1,power_law_1.01,0.19367680549621583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,1,1,power_law_1.2,0.8194944381713867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,1,1,power_law_1.01,0.20142719745635987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,1,1,power_law_1.2,0.8682432174682617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,1,1,power_law_1.01,0.22622079849243165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,1,1,power_law_1.2,29.585272216796874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,1,1,power_law_1.2,0.8760128021240234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,1,1,power_law_1.01,0.2103872060775757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,1,1,power_law_1.2,0.9345855712890625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,1,1,power_law_1.01,0.22190721035003663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,1,1,power_law_1.01,0.2342207908630371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,1,1,power_law_1.2,0.9628416061401367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,1,1,power_law_1.01,0.32309119701385497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,1,1,power_law_1.2,0.988646411895752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,1,1,power_law_1.01,0.36528639793395995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,1,1,power_law_1.2,1.0193728446960448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,1,1,power_law_1.2,0.028748801350593566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,1,1,power_law_1.01,0.45929598808288574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,1,1,power_law_1.2,1.070361614227295
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,1,1,power_law_1.2,0.033881598711013795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,1,1,power_law_1.01,0.5707007884979248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,1,1,power_law_1.2,1.1006784439086914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,1,1,power_law_1.2,0.0500544011592865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,1,1,power_law_1.01,0.769977617263794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,1,1,power_law_1.2,1.143289566040039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,1,1,power_law_1.2,0.07381759881973267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,1,1,power_law_1.01,0.9755904197692871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,1,1,power_law_1.2,1.3083392143249513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,1,1,power_law_1.2,0.10657919645309448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,1,1,power_law_1.01,1.3853759765625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,1,1,power_law_1.2,0.17169920206069947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,1,1,power_law_1.2,1.3820799827575683
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,1,1,power_law_1.01,1.7837440490722656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,1,1,power_law_1.2,0.19095040559768678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,1,1,power_law_1.2,1.5924032211303711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,1,1,power_law_1.01,2.584511947631836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,1,1,power_law_1.2,0.18173439502716066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,1,1,power_law_1.2,1.6567039489746094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,1,1,power_law_1.01,3.3942718505859375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,1,1,power_law_1.2,0.18666239976882934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,1,1,power_law_1.2,1.9559232711791992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,1,1,power_law_1.2,0.19011839628219604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,1,1,power_law_1.01,4.210604858398438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,1,1,power_law_1.2,0.21389439105987548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,1,1,power_law_1.2,2.367763137817383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,1,1,power_law_1.01,6.672710418701172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,1,1,power_law_1.2,0.20446720123291015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,1,1,power_law_1.2,2.9061887741088865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,1,1,power_law_1.2,0.2124608039855957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,1,1,power_law_1.01,13.219558715820312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,1,1,power_law_1.2,3.4081600189208983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,1,1,power_law_1.2,0.21778559684753418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,1,1,power_law_1.2,0.21470720767974855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,1,1,power_law_1.2,4.447923278808593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,1,1,power_law_1.2,0.21921279430389404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,1,1,power_law_1.2,5.578425598144531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,1,1,power_law_1.2,0.2454080104827881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,1,1,power_law_1.2,0.32605440616607667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,1,1,power_law_1.2,6.663597106933594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,1,1,power_law_1.2,0.37978239059448243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,1,1,power_law_1.2,0.47681279182434083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,1,1,power_law_1.2,10.150374603271484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,1,1,power_law_1.2,0.5751488208770752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,1,1,power_law_1.2,0.7609151840209961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,1,1,power_law_1.2,19.612953186035156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,1,1,power_law_1.2,0.9754752159118653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,1,1,power_law_1.2,1.3779840469360352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,1,1,power_law_1.2,1.7808128356933595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,1,1,power_law_1.01,0.06526079773902893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,1,1,power_law_1.2,2.584147262573242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,1,1,power_law_1.01,0.07509120106697083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,1,1,power_law_1.2,3.392582321166992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,1,1,power_law_1.01,0.1043776035308838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,1,1,power_law_1.01,0.1355839967727661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,1,1,power_law_1.2,4.21712646484375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,1,1,power_law_1.01,0.16785279512405396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,1,1,power_law_1.2,6.6816764831542965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,1,1,power_law_1.01,0.26978559494018556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,1,1,power_law_1.01,0.2798847913742065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,1,1,power_law_1.2,13.198200988769532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,1,1,power_law_1.01,0.2830976009368896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,1,1,power_law_1.01,0.29564800262451174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,1,1,power_law_1.2,0.06727039813995361
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,1,1,power_law_1.01,0.3052799940109253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,1,1,power_law_1.2,0.07771520018577575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,1,1,power_law_1.01,0.3116352081298828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,1,1,power_law_1.2,0.10249600410461426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,1,1,power_law_1.01,0.31449599266052247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,1,1,power_law_1.2,0.12399359941482543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,1,1,power_law_1.01,0.31710081100463866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,1,1,power_law_1.2,0.15287679433822632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,1,1,power_law_1.01,0.33000319004058837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,1,1,power_law_1.2,0.2628479957580566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,1,1,power_law_1.01,0.34494719505310056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,1,1,power_law_1.2,0.2825151920318604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,1,1,power_law_1.01,0.35895040035247805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,1,1,power_law_1.2,0.2968319892883301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,1,1,power_law_1.01,0.05538560152053833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,1,1,power_law_1.01,0.3835135936737061
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,1,1,power_law_1.2,0.29767038822174074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,1,1,power_law_1.01,0.07708160281181335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,1,1,power_law_1.01,0.45151357650756835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,1,1,power_law_1.2,0.3066751956939697
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,1,1,power_law_1.01,0.08896639943122864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,1,1,power_law_1.01,0.47315201759338377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,1,1,power_law_1.2,0.31157760620117186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,1,1,power_law_1.01,0.5682496070861817
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,1,1,power_law_1.01,0.1545024037361145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,1,1,power_law_1.2,0.3169152021408081
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,1,1,power_law_1.01,0.6745344161987304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,1,1,power_law_1.01,0.2390592098236084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,1,1,power_law_1.2,0.33085439205169676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,1,1,power_law_1.01,0.3699392080307007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,1,1,power_law_1.01,0.8471936225891114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,1,1,power_law_1.2,0.34375040531158446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,1,1,power_law_1.01,0.4139711856842041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,1,1,power_law_1.01,1.0124544143676757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,1,1,power_law_1.2,0.3607232093811035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,1,1,power_law_1.01,0.4477759838104248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,1,1,power_law_1.01,1.332147216796875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,1,1,power_law_1.2,0.36995840072631836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,1,1,power_law_1.01,0.49240961074829104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,1,1,power_law_1.01,1.6379072189331054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,1,1,power_law_1.2,0.3965888023376465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,1,1,power_law_1.01,0.4772672176361084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,1,1,power_law_1.01,2.2902015686035155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,1,1,power_law_1.2,0.46211838722229004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,1,1,power_law_1.01,0.5448448181152343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,1,1,power_law_1.2,0.4826047897338867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,1,1,power_law_1.01,2.954579162597656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,1,1,power_law_1.01,0.5731135845184326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,1,1,power_law_1.2,0.5665664196014404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,1,1,power_law_1.01,3.5783935546875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,1,1,power_law_1.01,0.5235455989837646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,1,1,power_law_1.2,0.6880127906799316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,1,1,power_law_1.01,0.5755648136138916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,1,1,power_law_1.2,0.852672004699707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,1,1,power_law_1.01,5.480160140991211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,1,1,power_law_1.01,0.6046656131744385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,1,1,power_law_1.2,1.013260841369629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,1,1,power_law_1.01,0.5768064022064209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,1,1,power_law_1.01,11.055436706542968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,1,1,power_law_1.2,1.3316927909851075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,1,1,power_law_1.01,0.6128384113311768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,1,1,power_law_1.2,1.6579391479492187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,1,1,power_law_1.01,0.8166208267211914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,1,1,power_law_1.2,2.281491279602051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,1,1,power_law_1.01,0.9161600112915039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,1,1,power_law_1.2,2.977868843078613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,1,1,power_law_1.01,1.1637439727783203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,1,1,power_law_1.2,3.6487998962402344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,1,1,power_law_1.01,1.3824640274047852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,1,1,power_law_1.2,5.598489761352539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,1,1,power_law_1.01,1.8619136810302734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,1,1,power_law_1.01,2.3358272552490233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,1,1,power_law_1.2,11.201414489746094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,1,1,power_law_1.01,3.2938751220703124
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,1,1,power_law_1.2,0.053990399837493895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,1,1,power_law_1.2,0.05615360140800476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,1,1,power_law_1.01,4.263398361206055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,1,1,power_law_1.2,0.08963840007781983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,1,1,power_law_1.01,6.208345413208008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,1,1,power_law_1.2,0.15045759677886963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,1,1,power_law_1.01,8.151929473876953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,1,1,power_law_1.2,0.23559679985046386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,1,1,power_law_1.2,0.3708224058151245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,1,1,power_law_1.01,10.06292495727539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,1,1,power_law_1.2,0.43717122077941895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,1,1,power_law_1.2,0.43506560325622556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,1,1,power_law_1.01,15.884165954589843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,1,1,power_law_1.2,0.5051712036132813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,1,1,power_law_1.2,0.5064000129699707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,1,1,power_law_1.2,0.5469567775726318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,1,1,power_law_1.01,31.330380249023438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,1,1,power_law_1.2,0.5932352066040039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,1,1,power_law_1.2,0.5628543853759765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,1,1,power_law_1.2,0.5820928096771241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,1,1,power_law_1.2,0.6475071907043457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,1,1,power_law_1.2,0.5756224155426025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,1,1,power_law_1.2,0.6372608184814453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,1,1,power_law_1.2,0.8194687843322754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,1,1,power_law_1.2,0.9308799743652344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,1,1,power_law_1.2,1.1736448287963868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,1,1,power_law_1.2,1.4243136405944825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,1,1,power_law_1.01,0.11559679508209228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,1,1,power_law_1.01,0.13444479703903198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,1,1,power_law_1.2,1.9289344787597655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,1,1,power_law_1.01,0.17499519586563111
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,1,1,power_law_1.2,2.3805055618286133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,1,1,power_law_1.01,0.2581248044967651
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,1,1,power_law_1.2,3.3127681732177736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,1,1,power_law_1.01,0.3560319900512695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,1,1,power_law_1.2,4.312601470947266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,1,1,power_law_1.01,0.5612287998199463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,1,1,power_law_1.2,6.268243026733399
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,1,1,power_law_1.01,0.6368192195892334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,1,1,power_law_1.01,0.6564671993255615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,1,1,power_law_1.2,8.195200347900391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,1,1,power_law_1.01,0.6654719829559326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,1,1,power_law_1.2,10.076493072509766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,1,1,power_law_1.01,0.6850687980651855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,1,1,power_law_1.01,0.7146431922912597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,1,1,power_law_1.2,15.873126220703124
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,1,1,power_law_1.01,0.7105535984039306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,1,1,power_law_1.2,0.115174400806427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,1,1,power_law_1.2,0.1223423957824707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,1,1,power_law_1.01,0.725273609161377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,1,1,power_law_1.01,0.15599360466003417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,1,1,power_law_1.2,0.165555202960968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,1,1,power_law_1.01,0.7551936149597168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,1,1,power_law_1.01,0.17319680452346803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,1,1,power_law_1.2,31.32878723144531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,1,1,power_law_1.01,0.7850880146026611
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,1,1,power_law_1.2,0.26774399280548095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,1,1,power_law_1.01,0.2893183946609497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,1,1,power_law_1.2,0.3140352010726929
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,1,1,power_law_1.01,0.8117055892944336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,1,1,power_law_1.01,0.4400512218475342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,1,1,power_law_1.01,0.8669952392578125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,1,1,power_law_1.2,0.5616384029388428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,1,1,power_law_1.01,0.5526847839355469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,1,1,power_law_1.2,0.6271872043609619
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,1,1,power_law_1.01,0.9763584136962891
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,1,1,power_law_1.01,0.7798079967498779
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,1,1,power_law_1.2,0.6589183807373047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,1,1,power_law_1.01,1.0576767921447754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,1,1,power_law_1.01,0.8539392471313476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,1,1,power_law_1.2,0.6871808052062989
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,1,1,power_law_1.01,1.2763968467712403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,1,1,power_law_1.01,0.8826111793518067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,1,1,power_law_1.2,0.681440019607544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,1,1,power_law_1.01,1.2890943527221679
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,1,1,power_law_1.01,0.9137408256530761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,1,1,power_law_1.2,0.735103988647461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,1,1,power_law_1.01,1.60263671875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,1,1,power_law_1.01,0.9072064399719239
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,1,1,power_law_1.2,0.7412479877471924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,1,1,power_law_1.01,1.9211008071899414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,1,1,power_law_1.01,0.9502143859863281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,1,1,power_law_1.2,0.7658368110656738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,1,1,power_law_1.01,2.45665283203125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,1,1,power_law_1.01,0.9669952392578125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,1,1,power_law_1.2,0.7793407917022706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,1,1,power_law_1.01,2.971718406677246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,1,1,power_law_1.01,1.0288384437561036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,1,1,power_law_1.2,0.7944896221160889
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,1,1,power_law_1.01,1.0439935684204102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,1,1,power_law_1.01,4.072934341430664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,1,1,power_law_1.2,0.836678409576416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,1,1,power_law_1.01,1.082700824737549
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,1,1,power_law_1.01,5.158784103393555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,1,1,power_law_1.2,0.8981184005737305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,1,1,power_law_1.01,1.130624008178711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,1,1,power_law_1.01,6.22149772644043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,1,1,power_law_1.2,1.0029888153076172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,1,1,power_law_1.01,1.2403776168823242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,1,1,power_law_1.2,1.0679167747497558
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,1,1,power_law_1.01,1.3239616394042968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,1,1,power_law_1.01,9.654354858398438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,1,1,power_law_1.2,1.2555071830749511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,1,1,power_law_1.01,1.5490367889404297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,1,1,power_law_1.2,1.3173503875732422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,1,1,power_law_1.01,1.6027135848999023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,1,1,power_law_1.01,19.22362823486328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,1,1,power_law_1.2,1.6059135437011718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,1,1,power_law_1.01,1.90435848236084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,1,1,power_law_1.2,1.9423999786376953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,1,1,power_law_1.01,2.2316287994384765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,1,1,power_law_1.2,2.459929656982422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,1,1,power_law_1.01,0.13530240058898926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,1,1,power_law_1.2,3.0114559173583983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,1,1,power_law_1.01,2.8210432052612306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,1,1,power_law_1.01,0.17358720302581787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,1,1,power_law_1.2,4.046720123291015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,1,1,power_law_1.01,3.353305435180664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,1,1,power_law_1.01,0.23893120288848876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,1,1,power_law_1.01,4.530303955078125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,1,1,power_law_1.2,5.447750473022461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,1,1,power_law_1.01,0.28048000335693357
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,1,1,power_law_1.01,0.4969791889190674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,1,1,power_law_1.2,6.619001770019532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,1,1,power_law_1.01,5.517792129516602
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,1,1,power_law_1.01,0.6876416206359863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,1,1,power_law_1.01,6.585075378417969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,1,1,power_law_1.2,9.790329742431641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,1,1,power_law_1.01,0.7994688034057618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,1,1,power_law_1.01,9.890943908691407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,1,1,power_law_1.01,1.052518367767334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,1,1,power_law_1.2,19.43169250488281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,1,1,power_law_1.01,1.1113727569580079
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,1,1,power_law_1.01,19.520845031738283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,1,1,power_law_1.01,1.1683072090148925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,1,1,power_law_1.01,1.2149951934814454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,1,1,power_law_1.01,1.271059226989746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,1,1,power_law_1.01,1.3059391975402832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,1,1,power_law_1.01,1.3116607666015625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,1,1,power_law_1.01,1.3726335525512696
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,1,1,power_law_1.01,1.4075200080871582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,1,1,power_law_1.01,1.4488960266113282
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,1,1,power_law_1.01,1.604319953918457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,1,1,power_law_1.2,0.1377087950706482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,1,1,power_law_1.01,1.6657663345336915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,1,1,power_law_1.2,0.17294080257415773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,1,1,power_law_1.01,1.936307144165039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,1,1,power_law_1.2,0.19833600521087646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,1,1,power_law_1.01,2.1390592575073244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,1,1,power_law_1.2,0.28108160495758056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,1,1,power_law_1.2,0.43427200317382814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,1,1,power_law_1.01,2.559916877746582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,1,1,power_law_1.2,0.5899136066436768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,1,1,power_law_1.01,2.636940765380859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,1,1,power_law_1.2,0.7261184215545654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,1,1,power_law_1.01,3.300902557373047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,1,1,power_law_1.2,0.9808896064758301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,1,1,power_law_1.01,3.983488082885742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,1,1,power_law_1.2,1.045580768585205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,1,1,power_law_1.01,5.075680160522461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,1,1,power_law_1.2,1.1219776153564454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,1,1,power_law_1.01,6.3464702606201175
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,1,1,power_law_1.2,1.177286434173584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,1,1,power_law_1.01,7.532275390625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,1,1,power_law_1.2,1.200224018096924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,1,1,power_law_1.2,1.266585636138916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,1,1,power_law_1.01,10.77158432006836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,1,1,power_law_1.2,1.3321151733398438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,1,1,power_law_1.2,1.376352024078369
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,1,1,power_law_1.01,19.633421325683592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,1,1,power_law_1.2,1.4115584373474122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,1,1,power_law_1.2,1.490828800201416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,1,1,power_law_1.2,1.6814271926879882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,1,1,power_law_1.2,1.7288127899169923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,1,1,power_law_1.2,1.974355125427246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,1,1,power_law_1.2,2.2442880630493165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,1,1,power_law_1.2,2.5971712112426757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,1,1,power_law_1.2,2.773088073730469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,1,1,power_law_1.2,3.399980926513672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,1,1,power_law_1.2,4.095820617675781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,1,1,power_law_1.2,5.190675354003906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,1,1,power_law_1.2,6.47996826171875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,1,1,power_law_1.2,7.700371551513672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,1,1,power_law_1.2,11.088915252685547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,1,1,power_law_1.2,20.74652862548828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,2,power_law_1.01,0.11845120191574096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,2,power_law_1.01,0.1672063946723938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,2,power_law_1.01,0.17210880517959595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,2,power_law_1.01,0.22881920337677003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,2,power_law_1.01,0.2380671977996826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,2,power_law_1.01,0.24152960777282714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,2,power_law_1.2,0.12703360319137574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,2,power_law_1.01,0.24296960830688477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,2,power_law_1.01,0.2722687959671021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,2,power_law_1.2,0.138374400138855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,2,power_law_1.2,0.18158719539642335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,2,power_law_1.01,0.28762240409851075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,2,power_law_1.2,0.22643840312957764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,2,power_law_1.01,0.3070784091949463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,2,power_law_1.2,0.23381760120391845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,2,power_law_1.01,0.2655103921890259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,2,power_law_1.2,0.2395456075668335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,2,power_law_1.01,0.2829056024551392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,2,power_law_1.2,0.24611198902130127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,2,power_law_1.01,0.2876287937164307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,2,power_law_1.2,0.24877440929412842
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,2,power_law_1.01,0.3134335994720459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,2,power_law_1.2,0.2743680000305176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,2,power_law_1.01,0.3337088108062744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,2,power_law_1.2,0.2878783941268921
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,2,power_law_1.01,0.35050239562988283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,2,power_law_1.2,0.2805056095123291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,2,power_law_1.01,0.4168447971343994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,2,power_law_1.2,0.29033598899841306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,2,power_law_1.01,0.4838143825531006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,2,power_law_1.2,0.28603520393371584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,2,power_law_1.01,0.616537618637085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,2,power_law_1.2,0.314303994178772
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,2,power_law_1.01,0.7482240200042725
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,2,power_law_1.2,0.3437887907028198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,2,power_law_1.01,0.9304767608642578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,2,power_law_1.2,0.3644799947738647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,2,power_law_1.01,1.2280511856079102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,2,power_law_1.2,0.44905600547790525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,2,power_law_1.01,1.5096575736999511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,2,power_law_1.2,0.5125504016876221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,2,power_law_1.01,2.4939199447631837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,2,power_law_1.2,0.6100287914276123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,2,power_law_1.01,3.3673919677734374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,2,power_law_1.2,0.7998847961425781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,2,power_law_1.01,5.443251037597657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,2,power_law_1.2,1.1216192245483398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,2,power_law_1.2,1.48220796585083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,2,power_law_1.01,6.515167999267578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,2,power_law_1.2,2.023142433166504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,2,power_law_1.01,8.473267364501954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,2,power_law_1.2,2.382566452026367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,2,power_law_1.01,17.347474670410158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,2,power_law_1.2,3.3353153228759767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,2,power_law_1.2,5.864582443237305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,2,power_law_1.2,8.568576049804687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,2,power_law_1.01,42.186221313476565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,1,power_law_1.01,0.08225280046463013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,2,power_law_1.2,11.81484146118164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,1,power_law_1.01,0.12343039512634277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,1,power_law_1.01,0.13443200588226317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,2,power_law_1.2,18.015577697753905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,1,power_law_1.01,0.2280639886856079
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,1,power_law_1.01,0.2286911964416504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,1,power_law_1.01,0.23893120288848876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,2,power_law_1.2,41.16842956542969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,1,power_law_1.01,0.25319681167602537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,1,power_law_1.01,0.2505919933319092
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,1,power_law_1.01,0.2596224069595337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,1,power_law_1.01,0.27764480113983153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,1,power_law_1.01,0.24705278873443604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,1,power_law_1.01,0.26166400909423826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,1,power_law_1.01,0.26801280975341796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,1,power_law_1.01,0.280019211769104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,1,power_law_1.01,0.30563199520111084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,1,power_law_1.01,0.3052864074707031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,1,power_law_1.01,0.3259711980819702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,1,power_law_1.01,0.393503999710083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,1,power_law_1.01,0.47649922370910647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,1,power_law_1.01,0.5898943901062011
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,1,power_law_1.01,0.7159103870391845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,1,power_law_1.01,0.9506112098693847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,1,power_law_1.01,1.2173952102661132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,1,power_law_1.01,1.7542463302612306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,1,power_law_1.01,2.2791488647460936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,1,power_law_1.01,3.5134654998779298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,1,power_law_1.2,0.08406400084495544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,1,power_law_1.2,0.09182080030441284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,1,power_law_1.01,5.080192184448242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,1,power_law_1.2,0.1471295952796936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,1,power_law_1.01,6.354246520996094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,1,power_law_1.2,0.23067519664764405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,1,power_law_1.2,0.23950719833374023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,1,power_law_1.01,11.119340515136718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,1,power_law_1.2,0.2419584035873413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,1,power_law_1.2,0.24380800724029542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,1,power_law_1.01,23.813478088378908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,1,power_law_1.2,0.24421119689941406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,1,power_law_1.2,0.24626560211181642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,1,power_law_1.2,0.24625918865203858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,1,power_law_1.2,0.2534336090087891
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,1,power_law_1.2,0.26654078960418703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,1,power_law_1.2,0.26735999584198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,1,power_law_1.2,0.26817920207977297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,1,power_law_1.2,0.3056576013565063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,1,power_law_1.2,0.3109760046005249
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,1,power_law_1.2,0.3318655967712402
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,1,power_law_1.2,0.40764799118041994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,1,power_law_1.2,0.4567999839782715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,1,power_law_1.2,0.5669824123382569
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,1,power_law_1.2,0.7207871913909912
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,1,power_law_1.2,0.9776127815246582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,1,power_law_1.2,1.244870376586914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,1,power_law_1.2,1.7832832336425781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,1,power_law_1.2,2.3780288696289062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,1,power_law_1.2,3.6201408386230467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,1,power_law_1.2,4.857734298706054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,1,power_law_1.2,6.084230422973633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,1,power_law_1.2,12.006642913818359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,1,power_law_1.2,25.9637451171875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,2,power_law_1.01,0.2302783966064453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,2,power_law_1.01,0.2470911979675293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,2,power_law_1.01,0.18297599554061889
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,2,power_law_1.01,0.40436477661132814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,2,power_law_1.01,0.3845056056976318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,2,power_law_1.01,0.3863359928131104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,2,power_law_1.01,0.40947837829589845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,2,power_law_1.01,0.4104959964752197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,2,power_law_1.01,0.41432957649230956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,2,power_law_1.01,0.42339839935302737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,2,power_law_1.01,0.4329984188079834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,2,power_law_1.01,0.4400000095367432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,2,power_law_1.01,0.46416001319885253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,2,power_law_1.01,0.46824960708618163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,2,power_law_1.2,0.2163520097732544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,2,power_law_1.01,0.5481279850006103
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,2,power_law_1.2,0.2715008020401001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,2,power_law_1.2,0.29402880668640136
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,2,power_law_1.01,0.531334400177002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,2,power_law_1.2,0.3874111890792847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,2,power_law_1.01,0.5927743911743164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,2,power_law_1.2,0.4029888153076172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,2,power_law_1.01,0.774015998840332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,2,power_law_1.2,0.4066624164581299
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,2,power_law_1.01,0.897708797454834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,2,power_law_1.2,0.4087103843688965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,2,power_law_1.01,1.2510016441345215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,2,power_law_1.2,0.4111743927001953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,2,power_law_1.01,1.4684864044189454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,2,power_law_1.2,0.4158912181854248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,2,power_law_1.01,1.9595712661743163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,2,power_law_1.2,0.4343167781829834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,2,power_law_1.01,2.9307775497436523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,2,power_law_1.2,0.4404736042022705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,2,power_law_1.01,3.8089534759521486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,2,power_law_1.2,0.45438718795776367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,2,power_law_1.2,0.4748672008514404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,2,power_law_1.01,5.262828826904297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,2,power_law_1.2,0.48592000007629393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,2,power_law_1.01,8.398713684082031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,2,power_law_1.2,0.5555583953857421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,2,power_law_1.2,0.5571839809417725
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,2,power_law_1.01,13.66375732421875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,1,power_law_1.01,0.12177920341491699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,2,power_law_1.2,0.5981632232666015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,1,power_law_1.01,0.15927040576934814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,2,power_law_1.01,14.424581909179688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,2,power_law_1.2,0.7781631946563721
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,1,power_law_1.01,0.19408639669418334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,2,power_law_1.2,0.9571776390075684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,1,power_law_1.01,0.34787840843200685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,2,power_law_1.2,1.2342528343200683
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,1,power_law_1.01,0.3743168115615845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,2,power_law_1.01,28.09578857421875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,2,power_law_1.2,1.4599360466003417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,1,power_law_1.01,0.38597118854522705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,1,power_law_1.01,0.3781248092651367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,2,power_law_1.2,2.5492927551269533
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,1,power_law_1.01,0.3894592046737671
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,2,power_law_1.2,2.9701311111450197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,2,power_law_1.01,59.75887451171875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,1,power_law_1.01,0.395795202255249
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,2,power_law_1.2,4.699462509155273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,1,power_law_1.01,0.3982399940490723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,2,power_law_1.2,6.381670379638672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,1,power_law_1.01,0.395795202255249
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,1,power_law_1.01,0.4226367950439453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,2,power_law_1.2,9.222502136230469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,1,power_law_1.01,0.4322624206542969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,2,power_law_1.2,16.558816528320314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,1,power_law_1.01,0.4230207920074463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,1,power_law_1.01,0.4728127956390381
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,2,power_law_1.2,18.497068786621092
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,1,power_law_1.01,0.4826367855072021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,1,power_law_1.01,0.5379392147064209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,1,power_law_1.01,0.6325568199157715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,2,power_law_1.2,30.575955200195313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,1,power_law_1.01,0.7142655849456787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,1,power_law_1.01,0.9292799949645996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,1,power_law_1.01,1.1600447654724122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,1,power_law_1.01,1.5936832427978516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,1,power_law_1.2,0.12051199674606324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,2,power_law_1.2,62.3336669921875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,1,power_law_1.2,0.1704767942428589
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,1,power_law_1.01,1.9465408325195312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,1,power_law_1.2,0.24954240322113036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,1,power_law_1.01,2.9058303833007812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,1,power_law_1.2,0.3582848072052002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,1,power_law_1.01,4.184390258789063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,1,power_law_1.2,0.374451208114624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,1,power_law_1.01,6.057900619506836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,1,power_law_1.2,0.3834624052047729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,1,power_law_1.2,0.38755838871002196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,1,power_law_1.01,8.609101104736329
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,1,power_law_1.2,0.3935103893280029
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,1,power_law_1.01,10.92968292236328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,1,power_law_1.2,0.39740159511566164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,1,power_law_1.2,0.40580477714538576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,1,power_law_1.01,21.37756805419922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,1,power_law_1.2,0.4039423942565918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,1,power_law_1.2,0.4162303924560547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,1,power_law_1.2,0.41130242347717283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,1,power_law_1.2,0.4321599960327148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,1,power_law_1.01,38.988729858398436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,1,power_law_1.2,0.4785088062286377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,1,power_law_1.2,0.4916096210479736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,1,power_law_1.2,0.5305215835571289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,1,power_law_1.2,0.6388671875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,1,power_law_1.2,0.7265215873718261
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,1,power_law_1.2,0.9292672157287598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,1,power_law_1.2,1.1535296440124512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,1,power_law_1.2,1.5973312377929687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,1,power_law_1.2,1.997305679321289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,1,power_law_1.2,2.866399955749512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,1,power_law_1.2,4.147833633422851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,1,power_law_1.2,6.281235122680664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,1,power_law_1.2,9.45647964477539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,1,power_law_1.2,11.72545928955078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,1,power_law_1.2,20.872831726074217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,1,power_law_1.2,46.8586181640625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,2,power_law_1.01,0.17231359481811523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,2,power_law_1.01,0.26365439891815184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,2,power_law_1.01,0.19096319675445556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,2,power_law_1.01,0.35890560150146483
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,2,power_law_1.01,0.5710591793060302
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,2,power_law_1.01,0.8010496139526367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,2,power_law_1.01,1.1391807556152345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,2,power_law_1.01,1.1617088317871094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,2,power_law_1.01,1.1760512351989747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,2,power_law_1.01,1.2780223846435548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,2,power_law_1.01,1.2866368293762207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,2,power_law_1.01,1.3222720146179199
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,2,power_law_1.01,1.349734401702881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,2,power_law_1.01,1.3996864318847657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,2,power_law_1.2,0.1674496054649353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,2,power_law_1.01,1.3853440284729004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,2,power_law_1.2,0.2559360027313232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,2,power_law_1.01,1.4508928298950194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,2,power_law_1.2,0.1942911982536316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,2,power_law_1.01,1.4912192344665527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,2,power_law_1.2,0.343174409866333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,2,power_law_1.01,1.5977279663085937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,2,power_law_1.2,0.4715775966644287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,2,power_law_1.01,1.6640703201293945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,2,power_law_1.2,0.7253312110900879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,2,power_law_1.01,1.8909887313842773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,2,power_law_1.2,1.138815975189209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,2,power_law_1.01,1.925619125366211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,2,power_law_1.2,1.2072319984436035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,2,power_law_1.01,2.2131391525268556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,2,power_law_1.2,1.2207488059997558
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,2,power_law_1.01,2.5520896911621094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,2,power_law_1.2,1.2858688354492187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,2,power_law_1.01,3.1701759338378905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,2,power_law_1.2,1.2797247886657714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,2,power_law_1.01,3.9305919647216796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,2,power_law_1.2,1.3563136100769042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,2,power_law_1.01,5.463321685791016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,2,power_law_1.2,1.3358464241027832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,2,power_law_1.2,1.4484736442565918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,2,power_law_1.01,7.187321472167969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,2,power_law_1.2,1.5027456283569336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,2,power_law_1.01,8.72128677368164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,2,power_law_1.2,1.5183103561401368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,1,power_law_1.01,0.11195520162582398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,2,power_law_1.2,1.5781120300292968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,1,power_law_1.01,0.16499840021133422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,2,power_law_1.01,14.45137939453125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,2,power_law_1.2,1.7063104629516601
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,1,power_law_1.01,0.18343039751052856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,1,power_law_1.01,0.35936000347137453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,2,power_law_1.2,1.8206144332885743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,2,power_law_1.01,31.450820922851562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,1,power_law_1.01,0.5657855987548828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,2,power_law_1.2,1.9625280380249024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,1,power_law_1.01,0.7822463989257813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,2,power_law_1.2,2.1292287826538088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,1,power_law_1.01,1.08023681640625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,2,power_law_1.2,2.466124725341797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,1,power_law_1.01,1.168716812133789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,2,power_law_1.2,2.700831985473633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,1,power_law_1.01,1.2145983695983886
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,2,power_law_1.2,3.4250110626220702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,1,power_law_1.01,1.2477631568908691
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,2,power_law_1.2,4.110252761840821
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,1,power_law_1.01,1.2895487785339355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,2,power_law_1.2,5.472761535644532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,1,power_law_1.01,1.3530495643615723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,2,power_law_1.2,7.912646484375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,1,power_law_1.01,1.3956288337707519
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,1,power_law_1.2,0.11230720281600952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,1,power_law_1.01,1.4333120346069337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,2,power_law_1.2,9.77154541015625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,1,power_law_1.2,0.1643455982208252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,1,power_law_1.01,1.4814528465270995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,1,power_law_1.2,0.19219839572906494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,1,power_law_1.01,1.5281472206115723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,2,power_law_1.2,17.860736083984374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,1,power_law_1.2,0.3369920015335083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,1,power_law_1.01,1.544934368133545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,1,power_law_1.2,0.48670082092285155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,1,power_law_1.01,1.6624832153320312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,2,power_law_1.2,39.5939208984375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,1,power_law_1.2,0.6474688053131104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,1,power_law_1.01,1.7259136199951173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,1,power_law_1.2,1.090015983581543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,1,power_law_1.01,1.9481792449951172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,1,power_law_1.2,1.1559743881225586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,1,power_law_1.01,2.0186304092407226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,1,power_law_1.2,1.1744064331054687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,1,power_law_1.01,2.332940864562988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,1,power_law_1.2,1.2325695991516112
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,1,power_law_1.01,2.7
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,1,power_law_1.2,1.3103872299194337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,1,power_law_1.01,3.3766590118408204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,1,power_law_1.2,1.349715232849121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,1,power_law_1.01,4.48524169921875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,1,power_law_1.2,1.4111552238464355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,1,power_law_1.01,5.967801666259765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,1,power_law_1.2,1.490835189819336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,1,power_law_1.2,1.5367103576660157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,1,power_law_1.01,7.64361572265625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,1,power_law_1.2,1.5489855766296388
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,1,power_law_1.01,9.334297943115235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,1,power_law_1.2,1.6304256439208984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,1,power_law_1.2,1.748396873474121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,1,power_law_1.01,15.080525207519532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,1,power_law_1.2,1.8295616149902343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,1,power_law_1.2,2.0280256271362305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,1,power_law_1.01,29.834567260742187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,1,power_law_1.2,2.0959104537963866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,1,power_law_1.2,2.4366016387939453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,1,power_law_1.2,2.8283071517944336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,1,power_law_1.2,3.4323200225830077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,1,power_law_1.2,4.5497791290283205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,1,power_law_1.2,6.2070976257324215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,1,power_law_1.2,7.958131408691406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,1,power_law_1.2,9.843328094482422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,1,power_law_1.2,16.142041015625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,1,power_law_1.2,32.030950927734374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,2,power_law_1.01,0.08199679851531982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,2,power_law_1.01,0.06316159963607788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,2,power_law_1.01,0.10616320371627808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,2,power_law_1.01,0.16494079828262329
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,2,power_law_1.01,0.1923840045928955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,2,power_law_1.01,0.31792640686035156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,2,power_law_1.01,0.33758718967437745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,2,power_law_1.01,0.3486720085144043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,2,power_law_1.01,0.35357439517974854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,2,power_law_1.01,0.3611455917358398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,2,power_law_1.01,0.3689280033111572
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,2,power_law_1.01,0.37281920909881594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,2,power_law_1.01,0.38368000984191897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,2,power_law_1.01,0.39432320594787595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,2,power_law_1.01,0.40517120361328124
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,2,power_law_1.01,0.4111167907714844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,2,power_law_1.01,0.429747200012207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,2,power_law_1.01,0.46497278213500975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,2,power_law_1.01,0.48299517631530764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,2,power_law_1.01,0.5587647914886474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,2,power_law_1.2,0.08082559704780579
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,2,power_law_1.01,0.630790376663208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,2,power_law_1.2,0.07488639950752259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,2,power_law_1.01,0.7846015930175781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,2,power_law_1.2,0.10172159671783447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,2,power_law_1.01,0.9669376373291015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,2,power_law_1.2,0.1379647970199585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,2,power_law_1.01,1.270860767364502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,2,power_law_1.2,0.17871999740600586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,2,power_law_1.01,1.4817983627319335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,2,power_law_1.2,0.3153215885162354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,2,power_law_1.01,2.1017343521118166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,2,power_law_1.2,0.3398911952972412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,2,power_law_1.01,2.768147277832031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,2,power_law_1.2,0.3546560049057007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,2,power_law_1.2,0.3570879936218262
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,2,power_law_1.01,3.6041473388671874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,2,power_law_1.2,0.3628351926803589
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,2,power_law_1.01,6.118265533447266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,2,power_law_1.2,0.37431039810180666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,2,power_law_1.2,0.3802367925643921
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,2,power_law_1.2,0.37737600803375243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,2,power_law_1.01,14.292031860351562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,2,power_law_1.2,0.39315199851989746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,2,power_law_1.2,0.4009088039398193
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,2,power_law_1.2,0.4281599998474121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,2,power_law_1.2,0.44046721458435056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,2,power_law_1.2,0.4806015968322754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,2,power_law_1.2,0.5010816097259522
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,2,power_law_1.2,0.578495979309082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,2,power_law_1.2,0.6634751796722412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,2,power_law_1.2,0.8284735679626465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,2,power_law_1.2,1.0485055923461915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,2,power_law_1.2,1.3260031700134278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,1,power_law_1.01,0.059520000219345094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,2,power_law_1.2,1.601875114440918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,1,power_law_1.01,0.06341760158538819
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,1,power_law_1.01,0.11297919750213622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,2,power_law_1.2,2.2549760818481444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,1,power_law_1.01,0.15352959632873536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,2,power_law_1.2,3.0586111068725588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,1,power_law_1.01,0.19942400455474854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,2,power_law_1.2,3.925324630737305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,1,power_law_1.01,0.32186241149902345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,1,power_law_1.01,0.3501375913619995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,2,power_law_1.2,6.133900833129883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,1,power_law_1.01,0.3577215909957886
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,1,power_law_1.01,0.3515712022781372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,2,power_law_1.2,15.677171325683593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,1,power_law_1.01,0.3641983985900879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,1,power_law_1.01,0.3708224058151245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,1,power_law_1.01,0.3810688018798828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,1,power_law_1.01,0.3863039970397949
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,1,power_law_1.01,0.3992831945419312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,1,power_law_1.2,0.060710400342941284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,1,power_law_1.01,0.41240320205688474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,1,power_law_1.2,0.06520959734916687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,1,power_law_1.01,0.423583984375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,1,power_law_1.2,0.10412800312042236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,1,power_law_1.01,0.4445375919342041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,1,power_law_1.2,0.14057600498199463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,1,power_law_1.01,0.4949183940887451
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,1,power_law_1.2,0.17560319900512694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,1,power_law_1.01,0.5211328029632568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,1,power_law_1.2,0.3208127975463867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,1,power_law_1.01,0.5911871910095214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,1,power_law_1.2,0.35192320346832273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,1,power_law_1.01,0.6748735904693604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,1,power_law_1.2,0.36627840995788574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,1,power_law_1.01,0.8424063682556152
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,1,power_law_1.2,0.37242879867553713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,1,power_law_1.01,1.0169599533081055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,1,power_law_1.2,0.3793728113174438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,1,power_law_1.01,1.3124863624572753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,1,power_law_1.2,0.3814271926879883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,1,power_law_1.01,1.6211135864257813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,1,power_law_1.2,0.39146239757537843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,1,power_law_1.01,2.261529541015625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,1,power_law_1.2,0.4047679901123047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,1,power_law_1.01,3.005753517150879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,1,power_law_1.2,0.41051521301269533
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,1,power_law_1.2,0.42463998794555663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,1,power_law_1.01,3.6046207427978514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,1,power_law_1.2,0.4305856227874756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,1,power_law_1.01,6.135123062133789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,1,power_law_1.2,0.45351037979125974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,1,power_law_1.2,0.5133120059967041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,1,power_law_1.01,13.143980407714844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,1,power_law_1.2,0.5317376136779786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,1,power_law_1.2,0.6058944225311279
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,1,power_law_1.2,0.685152006149292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,1,power_law_1.2,0.8514495849609375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,1,power_law_1.2,1.0214336395263672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,1,power_law_1.2,1.3316991806030274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,1,power_law_1.2,1.653036880493164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,1,power_law_1.2,2.3386240005493164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,1,power_law_1.2,3.0442176818847657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,1,power_law_1.2,3.720083236694336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,1,power_law_1.2,6.543154907226563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,1,power_law_1.2,12.15244140625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,2,power_law_1.01,0.18951679468154908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,2,power_law_1.01,0.2435904026031494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,2,power_law_1.01,0.21553919315338135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,2,power_law_1.01,0.3468096017837524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,2,power_law_1.01,0.4629312038421631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,2,power_law_1.01,0.8583935737609864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,2,power_law_1.01,0.9034560203552247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,2,power_law_1.01,0.9571136474609375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,2,power_law_1.01,0.9726783752441406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,2,power_law_1.01,0.9673600196838379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,2,power_law_1.01,1.00381441116333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,2,power_law_1.01,1.0410752296447754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,2,power_law_1.01,1.046412754058838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,2,power_law_1.01,1.0386240005493164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,2,power_law_1.01,1.095353603363037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,2,power_law_1.01,1.10763521194458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,2,power_law_1.01,1.149772834777832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,2,power_law_1.01,1.2374784469604492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,2,power_law_1.01,1.409932804107666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,2,power_law_1.01,1.6595775604248046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,2,power_law_1.01,1.6345855712890625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,2,power_law_1.01,1.9182336807250977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,2,power_law_1.2,0.1969472050666809
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,2,power_law_1.01,2.3771903991699217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,2,power_law_1.2,0.15025919675827026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,2,power_law_1.2,0.2006335973739624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,2,power_law_1.01,3.02044792175293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,2,power_law_1.2,0.3259711980819702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,2,power_law_1.01,4.199910354614258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,2,power_law_1.2,0.478547191619873
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,2,power_law_1.01,5.744895935058594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,2,power_law_1.2,0.8334591865539551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,2,power_law_1.2,0.9456959724426269
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,2,power_law_1.01,7.771635437011719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,2,power_law_1.2,0.9157695770263672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,2,power_law_1.01,10.10921630859375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,2,power_law_1.2,0.9927935600280762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,2,power_law_1.2,1.0349184036254884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,2,power_law_1.01,17.368524169921876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,2,power_law_1.2,1.045644760131836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,2,power_law_1.2,1.076159954071045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,2,power_law_1.2,1.0843135833740234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,2,power_law_1.01,35.456103515625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,2,power_law_1.2,1.0949312210083009
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,2,power_law_1.2,1.105241584777832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,2,power_law_1.2,1.171180820465088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,2,power_law_1.2,1.1924863815307618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,2,power_law_1.2,1.285465621948242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,2,power_law_1.2,1.5060159683227539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,2,power_law_1.2,1.8140607833862306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,2,power_law_1.2,1.7345216751098633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,2,power_law_1.2,1.985055923461914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,2,power_law_1.2,2.5693504333496096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,2,power_law_1.2,3.1743423461914064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,2,power_law_1.2,4.680646514892578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,2,power_law_1.2,6.511545562744141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,2,power_law_1.2,8.629491424560547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,1,power_law_1.01,0.11175040006637574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,2,power_law_1.2,10.047411346435547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,1,power_law_1.01,0.15271040201187133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,1,power_law_1.01,0.22213759422302246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,2,power_law_1.2,17.79295959472656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,1,power_law_1.01,0.3683520078659058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,1,power_law_1.01,0.4916543960571289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,1,power_law_1.01,0.8428863525390625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,2,power_law_1.2,35.763134765625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,1,power_law_1.01,0.9001600265502929
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,1,power_law_1.01,0.9226880073547363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,1,power_law_1.01,0.9452863693237304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,1,power_law_1.01,0.9674112319946289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,1,power_law_1.01,1.0202431678771973
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,1,power_law_1.01,1.0431872367858888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,1,power_law_1.2,0.11887359619140625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,1,power_law_1.2,0.12379519939422608
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,1,power_law_1.01,1.0316991806030273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,1,power_law_1.2,0.20816640853881835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,1,power_law_1.01,1.076972770690918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,1,power_law_1.2,0.31221120357513427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,1,power_law_1.01,1.0981632232666017
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,1,power_law_1.2,0.4387648105621338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,1,power_law_1.01,1.1428544044494628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,1,power_law_1.2,0.8125184059143067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,1,power_law_1.01,1.199852752685547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,1,power_law_1.2,0.9017919540405274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,1,power_law_1.01,1.2977472305297852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,1,power_law_1.2,0.9563072204589844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,1,power_law_1.01,1.3440320014953613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,1,power_law_1.2,0.9784064292907715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,1,power_law_1.01,1.544927978515625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,1,power_law_1.2,1.0165184020996094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,1,power_law_1.01,1.6321792602539062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,1,power_law_1.2,1.056447982788086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,1,power_law_1.01,1.9923648834228516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,1,power_law_1.2,1.075692844390869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,1,power_law_1.01,2.8390655517578125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,1,power_law_1.2,1.0728192329406738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,1,power_law_1.01,3.6119808197021483
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,1,power_law_1.2,1.1141632080078125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,1,power_law_1.01,4.317926406860352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,1,power_law_1.2,1.1469759941101074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,1,power_law_1.01,5.821977615356445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,1,power_law_1.2,1.1920063972473145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,1,power_law_1.2,1.2329919815063477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,1,power_law_1.01,7.2746429443359375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,1,power_law_1.2,1.3849535942077638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,1,power_law_1.01,9.289651489257812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,1,power_law_1.2,1.4447360038757324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,1,power_law_1.2,1.6513856887817382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,1,power_law_1.01,15.292767333984376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,1,power_law_1.2,1.6571136474609376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,1,power_law_1.2,1.9944255828857422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,1,power_law_1.2,2.414476776123047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,1,power_law_1.01,27.81507263183594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,1,power_law_1.2,3.0884607315063475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,1,power_law_1.2,4.416704177856445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,1,power_law_1.2,6.035737609863281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,1,power_law_1.2,7.738470458984375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,1,power_law_1.2,9.736217498779297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,1,power_law_1.2,16.25708770751953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,1,power_law_1.2,35.094546508789065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,2,power_law_1.01,0.1708799958229065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,2,power_law_1.01,0.2661119937896729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,2,power_law_1.01,0.4616703987121582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,2,power_law_1.01,0.3193599939346313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,2,power_law_1.01,0.6351615905761718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,2,power_law_1.01,0.9403264045715332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,2,power_law_1.01,1.105510425567627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,2,power_law_1.01,1.538259220123291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,2,power_law_1.01,1.5596287727355957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,2,power_law_1.01,1.6251775741577148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,2,power_law_1.01,1.722662353515625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,2,power_law_1.01,1.788198471069336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,2,power_law_1.01,1.8303808212280273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,2,power_law_1.01,1.9206975936889648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,2,power_law_1.01,1.9256063461303712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,2,power_law_1.01,1.949772834777832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,2,power_law_1.01,2.026790428161621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,2,power_law_1.01,2.1607295989990236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,2,power_law_1.01,2.227884864807129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,2,power_law_1.01,2.45665283203125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,2,power_law_1.2,0.16622719764709473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,2,power_law_1.2,0.26495358943939207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,2,power_law_1.01,2.647929573059082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,2,power_law_1.2,0.2825536012649536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,2,power_law_1.01,3.0838911056518556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,2,power_law_1.2,0.29770240783691404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,2,power_law_1.01,3.124095916748047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,2,power_law_1.2,0.5608831882476807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,2,power_law_1.01,3.702035140991211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,2,power_law_1.2,0.8244480133056641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,2,power_law_1.01,5.574732971191406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,2,power_law_1.2,0.987065601348877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,2,power_law_1.01,6.936460876464844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,2,power_law_1.2,1.4512831687927246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,2,power_law_1.2,1.5125887870788575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,2,power_law_1.01,8.134732818603515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,2,power_law_1.2,1.590828800201416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,2,power_law_1.01,10.021971130371094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,2,power_law_1.2,1.6550527572631837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,2,power_law_1.2,1.7718591690063477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,2,power_law_1.01,14.731756591796875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,2,power_law_1.2,1.7857856750488281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,2,power_law_1.2,1.8304384231567383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,2,power_law_1.01,34.18719482421875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,2,power_law_1.2,1.9006080627441406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,2,power_law_1.2,1.9543487548828125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,2,power_law_1.2,2.034617614746094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,2,power_law_1.2,2.2762880325317383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,2,power_law_1.2,2.2472000122070312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,2,power_law_1.2,2.5709056854248047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,2,power_law_1.2,2.7870527267456056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,2,power_law_1.2,3.244755172729492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,2,power_law_1.2,3.3602878570556642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,2,power_law_1.2,4.026297760009766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,2,power_law_1.2,4.977395248413086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,2,power_law_1.2,6.4814399719238285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,2,power_law_1.2,8.681196594238282
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,2,power_law_1.2,10.918227386474609
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,2,power_law_1.2,16.986656188964844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,1,power_law_1.01,0.11297919750213622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,1,power_law_1.01,0.1707327961921692
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,1,power_law_1.01,0.26676480770111083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,2,power_law_1.2,35.404928588867186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,1,power_law_1.01,0.33703041076660156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,1,power_law_1.01,0.635155200958252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,1,power_law_1.01,0.9509504318237305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,1,power_law_1.01,1.1326784133911132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,1,power_law_1.01,1.469375991821289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,1,power_law_1.01,1.5965503692626952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,1,power_law_1.2,0.1145792007446289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,1,power_law_1.01,1.6051456451416015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,1,power_law_1.2,0.17089920043945311
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,1,power_law_1.01,1.6747711181640625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,1,power_law_1.2,0.21553919315338135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,1,power_law_1.01,1.791116714477539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,1,power_law_1.2,0.31324799060821534
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,1,power_law_1.01,1.8287935256958008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,1,power_law_1.2,0.5587647914886474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,1,power_law_1.2,0.7932799816131592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,1,power_law_1.01,1.8603328704833983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,1,power_law_1.2,0.9726847648620606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,1,power_law_1.01,1.9858047485351562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,1,power_law_1.2,1.402079963684082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,1,power_law_1.01,1.9707263946533202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,1,power_law_1.2,1.4730175971984862
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,1,power_law_1.01,2.050182342529297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,1,power_law_1.2,1.543673610687256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,1,power_law_1.01,2.2197568893432615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,1,power_law_1.2,1.6427904129028321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,1,power_law_1.01,2.3255680084228514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,1,power_law_1.2,1.718547248840332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,1,power_law_1.01,2.5447744369506835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,1,power_law_1.2,1.7758975982666017
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,1,power_law_1.01,2.6840255737304686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,1,power_law_1.2,1.8332416534423828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,1,power_law_1.01,3.1412864685058595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,1,power_law_1.2,1.9727296829223633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,1,power_law_1.01,3.540019226074219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,1,power_law_1.2,2.0156671524047853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,1,power_law_1.01,4.38592643737793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,1,power_law_1.2,2.1377792358398438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,1,power_law_1.01,5.7674816131591795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,1,power_law_1.2,2.2745855331420897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,1,power_law_1.01,7.217683410644531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,1,power_law_1.2,2.3498559951782227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,1,power_law_1.01,8.54909439086914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,1,power_law_1.2,2.638047981262207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,1,power_law_1.2,2.834521675109863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,1,power_law_1.01,10.230028533935547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,1,power_law_1.2,3.3147647857666014
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,1,power_law_1.01,16.720217895507812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,1,power_law_1.2,3.7561153411865233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,1,power_law_1.2,4.574496078491211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,1,power_law_1.01,34.07761840820312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,1,power_law_1.2,6.001311874389648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,1,power_law_1.2,7.668402862548828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,1,power_law_1.2,8.953542327880859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,1,power_law_1.2,11.45879669189453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,1,power_law_1.2,16.14228515625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,2,power_law_1.01,0.09305599927902222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,2,power_law_1.01,0.10862079858779908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,1,power_law_1.2,35.403628540039065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,2,power_law_1.01,0.09470080137252808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,2,power_law_1.01,0.14056960344314576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,2,power_law_1.01,0.141593599319458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,2,power_law_1.01,0.14425599575042725
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,2,power_law_1.01,0.1356608033180237
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,2,power_law_1.01,0.15900800228118897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,2,power_law_1.01,0.16064640283584594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,2,power_law_1.01,0.16147199869155884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,2,power_law_1.01,0.15736960172653197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,2,power_law_1.01,0.16350719928741456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,2,power_law_1.01,0.16473599672317504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,2,power_law_1.01,0.18522239923477174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,2,power_law_1.01,0.20037760734558105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,2,power_law_1.01,0.23069438934326172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,2,power_law_1.01,0.24195199012756347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,2,power_law_1.01,0.29356799125671384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,2,power_law_1.01,0.36217598915100097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,2,power_law_1.01,0.41091198921203614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,2,power_law_1.01,0.5129024028778076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,2,power_law_1.01,0.7748288154602051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,2,power_law_1.01,0.9542400360107421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,2,power_law_1.01,1.4578432083129882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,2,power_law_1.01,1.8537216186523438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,2,power_law_1.01,2.7939584732055662
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,2,power_law_1.01,4.116767883300781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,2,power_law_1.01,5.040825653076172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,2,power_law_1.01,6.981260681152344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,2,power_law_1.2,0.08718079924583436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,2,power_law_1.01,17.654054260253908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,2,power_law_1.2,0.0974016010761261
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,2,power_law_1.2,0.09292160272598267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,2,power_law_1.2,0.12608640193939208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,2,power_law_1.2,0.14123519659042358
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,2,power_law_1.2,0.14288640022277832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,2,power_law_1.2,0.1469823956489563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,2,power_law_1.2,0.15455360412597657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,2,power_law_1.2,0.15516799688339233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,2,power_law_1.2,0.15886720418930053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,2,power_law_1.2,0.16173440217971802
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,2,power_law_1.2,0.1670464038848877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,2,power_law_1.2,0.17073919773101806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,2,power_law_1.2,0.1879487991333008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,2,power_law_1.2,0.20719358921051026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,2,power_law_1.2,0.21251840591430665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,2,power_law_1.2,0.2524480104446411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,2,power_law_1.2,0.3026367902755737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,2,power_law_1.2,0.3429696083068848
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,2,power_law_1.2,0.4166975975036621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,2,power_law_1.2,0.5838143825531006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,2,power_law_1.2,0.7699135780334473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,2,power_law_1.2,1.1461888313293458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,2,power_law_1.2,1.5011263847351075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,2,power_law_1.2,1.829587173461914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,2,power_law_1.2,2.8824256896972655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,2,power_law_1.2,3.559756851196289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,2,power_law_1.2,5.072832107543945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,2,power_law_1.2,9.278591918945313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,2,power_law_1.2,19.430067443847655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,1,power_law_1.01,0.06423680186271667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,1,power_law_1.01,0.07406719923019409
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,1,power_law_1.01,0.09045760035514831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,1,power_law_1.01,0.13346560001373292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,1,power_law_1.01,0.13713279962539673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,1,power_law_1.01,0.13838080167770386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,1,power_law_1.01,0.14288640022277832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,1,power_law_1.01,0.14410879611968994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,1,power_law_1.01,0.14821120500564575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,1,power_law_1.01,0.14820480346679688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,1,power_law_1.01,0.1510591983795166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,1,power_law_1.01,0.15230079889297485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,1,power_law_1.01,0.1572224020957947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,1,power_law_1.2,0.06172800064086914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,1,power_law_1.01,0.1707327961921692
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,1,power_law_1.2,0.07791360020637512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,1,power_law_1.01,0.1854848027229309
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,1,power_law_1.2,0.09594240188598632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,1,power_law_1.01,0.1866943955421448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,1,power_law_1.2,0.13874560594558716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,1,power_law_1.01,0.20349440574645997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,1,power_law_1.2,0.13628159761428832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,1,power_law_1.01,0.24343039989471435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,1,power_law_1.2,0.13935999870300292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,1,power_law_1.01,0.27844479084014895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,1,power_law_1.2,0.14365439414978026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,1,power_law_1.01,0.35403521060943605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,1,power_law_1.2,0.1454975962638855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,1,power_law_1.01,0.42469120025634766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,1,power_law_1.2,0.1469375967979431
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,1,power_law_1.01,0.5751488208770752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,1,power_law_1.2,0.148364794254303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,1,power_law_1.01,0.715500783920288
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,1,power_law_1.2,0.15164799690246583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,1,power_law_1.2,0.1552575945854187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,1,power_law_1.01,0.997708797454834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,1,power_law_1.2,0.15718400478363037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,1,power_law_1.01,1.2817728042602539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,1,power_law_1.2,0.16639360189437866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,1,power_law_1.01,1.859507179260254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,1,power_law_1.2,0.1856384038925171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,1,power_law_1.01,2.5144447326660155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,1,power_law_1.2,0.18810240030288697
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,1,power_law_1.01,3.190297508239746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,1,power_law_1.2,0.20407679080963134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,1,power_law_1.2,0.2403264045715332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,1,power_law_1.01,5.157996749877929
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,1,power_law_1.2,0.28557438850402833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,1,power_law_1.01,10.946489715576172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,1,power_law_1.2,0.3548095941543579
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,1,power_law_1.2,0.42527360916137696
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,1,power_law_1.2,0.5747647762298584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,1,power_law_1.2,0.7047359943389893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,1,power_law_1.2,1.0102784156799316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,1,power_law_1.2,1.2936127662658692
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,1,power_law_1.2,1.9263744354248047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,1,power_law_1.2,2.5648000717163084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,1,power_law_1.2,3.323731231689453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,1,power_law_1.2,5.712921524047852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,1,power_law_1.2,11.324658966064453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,2,power_law_1.01,0.12131839990615845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,2,power_law_1.01,0.13032959699630736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,2,power_law_1.01,0.16883200407028198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,2,power_law_1.01,0.22064640522003173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,2,power_law_1.01,0.2167680025100708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,2,power_law_1.01,0.21777920722961425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,2,power_law_1.01,0.2191551923751831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,2,power_law_1.01,0.2270143985748291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,2,power_law_1.01,0.23007359504699706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,2,power_law_1.01,0.2343679904937744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,2,power_law_1.01,0.23189759254455566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,2,power_law_1.01,0.24419839382171632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,2,power_law_1.01,0.2538367986679077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,2,power_law_1.01,0.26426239013671876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,2,power_law_1.01,0.2933311939239502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,2,power_law_1.01,0.31296639442443847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,2,power_law_1.01,0.329804801940918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,2,power_law_1.01,0.3961600065231323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,2,power_law_1.01,0.5178112030029297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,2,power_law_1.01,0.6486911773681641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,2,power_law_1.01,0.7985407829284668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,2,power_law_1.01,1.13754243850708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,2,power_law_1.01,1.3484800338745118
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,2,power_law_1.01,1.8618431091308594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,2,power_law_1.01,2.3415552139282227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,2,power_law_1.01,4.205036926269531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,2,power_law_1.01,5.600537490844727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,2,power_law_1.01,8.35244140625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,2,power_law_1.01,14.761260986328125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,2,power_law_1.2,0.13059840202331544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,2,power_law_1.2,0.13141119480133057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,2,power_law_1.01,28.932583618164063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,2,power_law_1.2,0.13685120344161988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,2,power_law_1.2,0.21682560443878174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,2,power_law_1.2,0.20760960578918458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,2,power_law_1.2,0.21825919151306153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,2,power_law_1.2,0.21967999935150145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,2,power_law_1.2,0.2266495943069458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,2,power_law_1.2,0.23496320247650146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,2,power_law_1.2,0.241593599319458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,2,power_law_1.2,0.23955199718475342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,2,power_law_1.2,0.2551104068756104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,2,power_law_1.2,0.2512255907058716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,2,power_law_1.2,0.2751807928085327
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,2,power_law_1.2,0.29750399589538573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,2,power_law_1.2,0.32184319496154784
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,2,power_law_1.2,0.34767999649047854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,2,power_law_1.2,0.46372480392456056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,2,power_law_1.2,0.5182911872863769
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,2,power_law_1.2,0.631763219833374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,2,power_law_1.2,0.8260928153991699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,2,power_law_1.2,1.1470144271850586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,2,power_law_1.2,1.7545856475830077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,2,power_law_1.2,2.3227712631225588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,2,power_law_1.2,2.810745620727539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,2,power_law_1.2,4.115935897827148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,2,power_law_1.2,6.200255966186523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,2,power_law_1.2,9.095065307617187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,2,power_law_1.2,15.925996398925781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,2,power_law_1.2,38.46320495605469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,1,power_law_1.01,0.08062719702720642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,1,power_law_1.01,0.11421439647674561
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,1,power_law_1.01,0.13018879890441895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,1,power_law_1.01,0.21128320693969727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,1,power_law_1.01,0.20635519027709961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,1,power_law_1.01,0.21436800956726074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,1,power_law_1.01,0.21722240447998048
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,1,power_law_1.01,0.2178368091583252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,1,power_law_1.01,0.22132480144500732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,1,power_law_1.01,0.22023680210113525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,1,power_law_1.01,0.22329599857330323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,1,power_law_1.01,0.22930560111999512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,1,power_law_1.01,0.2336064100265503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,1,power_law_1.2,0.08323839902877808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,1,power_law_1.01,0.24876160621643068
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,1,power_law_1.2,0.10513919591903687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,1,power_law_1.2,0.11355520486831665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,1,power_law_1.01,0.27886080741882324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,1,power_law_1.2,0.2014143943786621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,1,power_law_1.01,0.2853951930999756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,1,power_law_1.2,0.1997760057449341
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,1,power_law_1.01,0.3120448112487793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,1,power_law_1.2,0.2155456066131592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,1,power_law_1.01,0.36036479473114014
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,1,power_law_1.2,0.21676158905029297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,1,power_law_1.01,0.4301504135131836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,1,power_law_1.2,0.21799039840698242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,1,power_law_1.01,0.5399231910705566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,1,power_law_1.2,0.21595520973205568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,1,power_law_1.01,0.6385024070739747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,1,power_law_1.2,0.22128639221191407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,1,power_law_1.01,0.8492287635803223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,1,power_law_1.2,0.2249664068222046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,1,power_law_1.01,1.0843456268310547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,1,power_law_1.2,0.23888640403747557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,1,power_law_1.01,1.5187135696411134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,1,power_law_1.2,0.2380608081817627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,1,power_law_1.01,1.9640832901000977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,1,power_law_1.2,0.2517888069152832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,1,power_law_1.01,2.9148223876953123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,1,power_law_1.2,0.27307519912719724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,1,power_law_1.01,3.891328048706055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,1,power_law_1.2,0.28455679416656493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,1,power_law_1.2,0.3043584108352661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,1,power_law_1.01,5.136307144165039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,1,power_law_1.2,0.3644160032272339
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,1,power_law_1.01,8.312761688232422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,1,power_law_1.2,0.41584000587463377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,1,power_law_1.2,0.520691204071045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,1,power_law_1.01,20.502252197265626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,1,power_law_1.2,0.6600704193115234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,1,power_law_1.2,0.8883071899414062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,1,power_law_1.2,1.0806143760681153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,1,power_law_1.2,1.5293439865112304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,1,power_law_1.2,2.000992012023926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,1,power_law_1.2,3.0154111862182615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,1,power_law_1.2,4.357952117919922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,1,power_law_1.2,5.6982463836669925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,1,power_law_1.2,9.160569763183593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,1,power_law_1.2,21.05531463623047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,2,power_law_1.01,0.11088000535964966
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,2,power_law_1.01,0.16842880249023437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,2,power_law_1.01,0.14017280340194702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,2,power_law_1.01,0.21777920722961425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,2,power_law_1.01,0.30215680599212646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,2,power_law_1.01,0.42339839935302737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,2,power_law_1.01,0.6259520053863525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,2,power_law_1.01,0.6433536052703858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,2,power_law_1.01,0.6736639976501465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,2,power_law_1.01,0.6888256072998047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,2,power_law_1.01,0.7269248008728028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,2,power_law_1.01,0.7219327926635742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,2,power_law_1.01,0.7547584056854248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,2,power_law_1.01,0.7465727806091309
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,2,power_law_1.01,0.783846378326416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,2,power_law_1.01,0.7981760025024414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,2,power_law_1.01,0.8407808303833008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,2,power_law_1.01,0.9001791954040528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,2,power_law_1.01,0.9431872367858887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,2,power_law_1.01,1.0431232452392578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,2,power_law_1.01,1.1461248397827148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,2,power_law_1.01,1.3099776268005372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,2,power_law_1.01,1.567795181274414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,2,power_law_1.01,1.9157695770263672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,2,power_law_1.2,0.10970239639282227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,2,power_law_1.01,2.348934364318848
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,2,power_law_1.2,0.16110719442367555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,2,power_law_1.2,0.13326079845428468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,2,power_law_1.01,3.145369529724121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,2,power_law_1.2,0.20903680324554444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,2,power_law_1.01,4.328531265258789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,2,power_law_1.2,0.2835903882980347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,2,power_law_1.01,5.107577514648438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,2,power_law_1.2,0.38372480869293213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,2,power_law_1.2,0.5780799865722657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,2,power_law_1.01,7.701996612548828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,2,power_law_1.2,0.6276480197906494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,2,power_law_1.2,0.6649663925170899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,2,power_law_1.01,18.22109375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,2,power_law_1.2,0.6946176052093506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,2,power_law_1.2,0.6753600120544434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,2,power_law_1.2,0.6995327949523926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,2,power_law_1.2,0.7388415813446045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,2,power_law_1.2,0.7687232017517089
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,2,power_law_1.2,0.7789887905120849
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,2,power_law_1.2,0.8359359741210938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,2,power_law_1.2,0.8559935569763184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,2,power_law_1.2,0.9284928321838379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,2,power_law_1.2,0.996070384979248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,2,power_law_1.2,1.0990976333618163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,2,power_law_1.2,1.1837759971618653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,2,power_law_1.2,1.400556755065918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,2,power_law_1.2,1.619481658935547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,2,power_law_1.2,1.994476890563965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,2,power_law_1.2,2.4509695053100584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,2,power_law_1.2,3.295571136474609
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,2,power_law_1.2,4.349887847900391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,2,power_law_1.2,4.742483139038086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,2,power_law_1.2,9.324044799804687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,2,power_law_1.2,16.564556884765626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,2,power_law_1.01,0.063155198097229
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,1,power_law_1.01,0.08798720240592957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,2,power_law_1.01,0.05742719769477844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,1,power_law_1.01,0.11463040113449097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,2,power_law_1.01,0.07872639894485474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,1,power_law_1.01,0.13509759902954102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,2,power_law_1.01,0.10042879581451417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,1,power_law_1.01,0.2204927921295166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,2,power_law_1.01,0.12561919689178466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,2,power_law_1.01,0.18275840282440187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,1,power_law_1.01,0.3220799922943115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,2,power_law_1.01,0.19423359632492065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,1,power_law_1.01,0.42712960243225095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,2,power_law_1.01,0.20325760841369628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,1,power_law_1.01,0.6002048015594482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,2,power_law_1.01,0.2026304006576538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,1,power_law_1.01,0.6520063877105713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,1,power_law_1.2,0.08815360069274902
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,2,power_law_1.01,0.21101438999176025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,1,power_law_1.01,0.68886399269104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,1,power_law_1.2,0.11478400230407715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,2,power_law_1.01,0.21532158851623534
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,1,power_law_1.01,0.6921279907226563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,1,power_law_1.2,0.1274623990058899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,2,power_law_1.01,0.22206718921661378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,2,power_law_1.01,0.224947190284729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,1,power_law_1.01,0.7114048004150391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,1,power_law_1.2,0.19791359901428224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,2,power_law_1.01,0.22945919036865234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,1,power_law_1.2,0.2966464042663574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,1,power_law_1.01,0.7507199764251709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,2,power_law_1.01,0.23804159164428712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,1,power_law_1.2,0.3846976041793823
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,1,power_law_1.01,0.7478528022766113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,2,power_law_1.01,0.24952321052551268
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,1,power_law_1.2,0.5817215919494629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,1,power_law_1.01,0.7818304061889648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,2,power_law_1.01,0.26182401180267334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,1,power_law_1.2,0.6128448009490967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,1,power_law_1.01,0.7883967876434326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,2,power_law_1.01,0.2843264102935791
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,1,power_law_1.2,0.6785791873931885
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,1,power_law_1.01,0.8322303771972657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,2,power_law_1.01,0.30461440086364744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,1,power_law_1.2,0.6888383865356446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,1,power_law_1.01,0.854758358001709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,2,power_law_1.01,0.3531519889831543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,2,power_law_1.01,0.41132159233093263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,1,power_law_1.2,0.7154560089111328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,1,power_law_1.01,0.9399552345275879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,2,power_law_1.01,0.5251967906951904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,1,power_law_1.2,0.7580543994903565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,1,power_law_1.01,1.007532787322998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,2,power_law_1.01,0.6337088108062744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,1,power_law_1.2,0.7789184093475342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,1,power_law_1.01,1.1465855598449708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,2,power_law_1.2,0.060550397634506224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,2,power_law_1.01,0.8198847770690918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,1,power_law_1.2,0.7977727890014649
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,1,power_law_1.01,1.2334336280822753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,2,power_law_1.2,0.05767679810523987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,2,power_law_1.01,0.9968319892883301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,2,power_law_1.2,0.06628479957580566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,1,power_law_1.2,0.7977791786193847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,1,power_law_1.01,1.4656767845153809
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,2,power_law_1.01,1.4656319618225098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,2,power_law_1.2,0.09271680116653443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,1,power_law_1.2,0.8894911766052246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,1,power_law_1.01,1.7021696090698242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,2,power_law_1.2,0.11319680213928222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,2,power_law_1.01,1.7914560317993165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,1,power_law_1.2,0.9030464172363282
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,1,power_law_1.01,2.156255912780762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,2,power_law_1.2,0.175654399394989
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,2,power_law_1.01,2.2438655853271485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,1,power_law_1.2,0.9939711570739747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,1,power_law_1.01,2.6070207595825194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,2,power_law_1.2,0.19039360284805298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,1,power_law_1.2,1.0308544158935546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,2,power_law_1.01,3.883494567871094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,2,power_law_1.2,0.20126080513000488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,1,power_law_1.01,3.5618049621582033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,1,power_law_1.2,1.186291217803955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,2,power_law_1.2,0.21560320854187012
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,1,power_law_1.01,4.757632064819336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,2,power_law_1.01,7.246310424804688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,2,power_law_1.2,0.20799999237060546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,1,power_law_1.2,1.271667194366455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,2,power_law_1.2,0.2235647916793823
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,1,power_law_1.01,5.778982543945313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,1,power_law_1.2,1.4965696334838867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,2,power_law_1.2,0.22111361026763915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,1,power_law_1.2,1.747225570678711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,1,power_law_1.01,8.922444915771484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,2,power_law_1.2,0.23094398975372316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,1,power_law_1.2,2.197177505493164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,2,power_law_1.2,0.23216640949249268
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,2,power_law_1.2,0.2424191951751709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,1,power_law_1.2,2.743110466003418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,1,power_law_1.01,17.982386779785156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,2,power_law_1.2,0.24712960720062255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,1,power_law_1.2,3.653299331665039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,2,power_law_1.2,0.2604351997375488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,1,power_law_1.2,4.8954113006591795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,2,power_law_1.2,0.2981247901916504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,2,power_law_1.2,0.3128767967224121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,1,power_law_1.2,5.935801696777344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,2,power_law_1.2,0.3677567958831787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,2,power_law_1.2,0.4197247982025146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,1,power_law_1.2,9.685011291503907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,2,power_law_1.2,0.5301504135131836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,2,power_law_1.2,0.631328010559082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,1,power_law_1.2,16.695558166503908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,2,power_law_1.2,0.8583616256713867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,2,power_law_1.2,1.1212032318115235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,2,power_law_1.2,1.5288960456848144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,2,power_law_1.2,1.9187135696411133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,2,power_law_1.2,2.3141759872436523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,2,power_law_1.2,3.6607295989990236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,2,power_law_1.2,7.807469177246094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,1,power_law_1.01,0.04799999892711639
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,1,power_law_1.01,0.05415679812431336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,1,power_law_1.01,0.07994880080223084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,1,power_law_1.01,0.1041152000427246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,1,power_law_1.01,0.12749439477920532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,1,power_law_1.01,0.19219199419021607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,1,power_law_1.01,0.20098559856414794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,1,power_law_1.2,0.045388799905776975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,1,power_law_1.01,0.21144320964813232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,1,power_law_1.2,0.055641597509384154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,1,power_law_1.01,0.2130687952041626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,1,power_law_1.2,0.07120000123977661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,1,power_law_1.01,0.22004480361938478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,1,power_law_1.2,0.09249280095100403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,1,power_law_1.01,0.2370368003845215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,1,power_law_1.2,0.11871360540390015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,1,power_law_1.01,0.2488640069961548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,1,power_law_1.2,0.19367040395736695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,1,power_law_1.01,0.25484800338745117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,1,power_law_1.2,0.20677759647369384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,1,power_law_1.01,0.25689599514007566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,1,power_law_1.2,0.21742720603942872
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,1,power_law_1.01,0.27879040241241454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,1,power_law_1.2,0.22070400714874266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,1,power_law_1.01,0.2896640062332153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,1,power_law_1.2,0.22191998958587647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,1,power_law_1.01,0.2773823976516724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,1,power_law_1.2,0.22807679176330567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,1,power_law_1.01,0.32359039783477783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,1,power_law_1.2,0.23300480842590332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,1,power_law_1.01,0.3461888074874878
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,1,power_law_1.2,0.23975040912628173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,1,power_law_1.01,0.4260416030883789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,1,power_law_1.2,0.25038719177246094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,1,power_law_1.01,0.481766414642334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,1,power_law_1.2,0.2567487955093384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,1,power_law_1.01,0.6288064002990723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,1,power_law_1.2,0.26740479469299316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,1,power_law_1.01,0.7637824058532715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,1,power_law_1.2,0.2854207992553711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,1,power_law_1.01,1.0242815971374513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,1,power_law_1.2,0.3323199987411499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,1,power_law_1.01,1.2688128471374511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,1,power_law_1.2,0.35199999809265137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,1,power_law_1.01,1.787775993347168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,1,power_law_1.2,0.4308288097381592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,1,power_law_1.01,2.37392635345459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,1,power_law_1.2,0.48142080307006835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,1,power_law_1.2,0.6198463916778565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,1,power_law_1.01,2.8467647552490236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,1,power_law_1.2,0.764249610900879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,1,power_law_1.01,4.444236755371094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,1,power_law_1.2,1.015718364715576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,1,power_law_1.2,1.2534848213195802
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,1,power_law_1.01,8.77364501953125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,1,power_law_1.2,1.7431232452392578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,1,power_law_1.2,2.2275264739990233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,1,power_law_1.2,2.7787071228027345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,1,power_law_1.2,4.366400146484375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,1,power_law_1.2,8.697984313964843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,2,power_law_1.01,0.11805440187454223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,2,power_law_1.01,0.15792640447616577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,2,power_law_1.01,0.1491711974143982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,2,power_law_1.01,0.1950592041015625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,2,power_law_1.01,0.28886399269104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,2,power_law_1.01,0.46581120491027833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,2,power_law_1.01,0.48629121780395507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,2,power_law_1.01,0.5182400226593018
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,2,power_law_1.01,0.5309311866760253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,2,power_law_1.01,0.5325503826141358
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,2,power_law_1.2,0.10990079641342163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,2,power_law_1.01,0.5362495899200439
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,2,power_law_1.2,0.1011072039604187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,2,power_law_1.01,0.560422420501709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,2,power_law_1.2,0.13427200317382812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,2,power_law_1.01,0.5743423938751221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,2,power_law_1.2,0.1764032006263733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,2,power_law_1.01,0.5763967990875244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,2,power_law_1.2,0.2573632001876831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,2,power_law_1.01,0.6017983913421631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,2,power_law_1.2,0.4535679817199707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,2,power_law_1.01,0.6013696193695068
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,2,power_law_1.2,0.4728127956390381
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,2,power_law_1.01,0.6388480186462402
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,2,power_law_1.2,0.5072319984436036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,2,power_law_1.2,0.5309823989868164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,2,power_law_1.01,0.683513593673706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,2,power_law_1.2,0.5391744136810303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,2,power_law_1.01,0.7387904167175293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,2,power_law_1.2,0.5682623863220215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,2,power_law_1.01,0.860051155090332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,2,power_law_1.2,0.5776447772979736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,2,power_law_1.01,0.8920063972473145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,2,power_law_1.2,0.554310417175293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,2,power_law_1.01,1.082259178161621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,2,power_law_1.2,0.6153471946716309
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,2,power_law_1.01,1.3279423713684082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,2,power_law_1.2,0.6401408195495606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,2,power_law_1.01,1.675494384765625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,2,power_law_1.2,0.6704383850097656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,2,power_law_1.01,2.0988927841186524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,2,power_law_1.2,0.645465612411499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,2,power_law_1.01,2.947353553771973
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,2,power_law_1.2,0.7196032047271729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,2,power_law_1.01,4.1003776550292965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,2,power_law_1.2,0.7949567794799804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,2,power_law_1.01,4.751436614990235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,2,power_law_1.2,0.9702719688415528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,2,power_law_1.2,0.9203071594238281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,2,power_law_1.01,7.6237632751464846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,2,power_law_1.2,1.1715840339660644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,2,power_law_1.2,1.419814395904541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,2,power_law_1.01,16.176422119140625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,2,power_law_1.2,1.8745983123779297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,2,power_law_1.2,2.16693115234375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,2,power_law_1.2,3.0696128845214843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,2,power_law_1.2,4.226528167724609
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,2,power_law_1.2,5.360979080200195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,2,power_law_1.2,8.741343688964843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,2,power_law_1.2,17.68892822265625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,1,power_law_1.01,0.088755202293396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,1,power_law_1.01,0.10862079858779908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,1,power_law_1.01,0.14466559886932373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,1,power_law_1.01,0.21534080505371095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,1,power_law_1.01,0.2904831886291504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,1,power_law_1.01,0.46949119567871095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,1,power_law_1.01,0.4998015880584717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,1,power_law_1.01,0.5284736156463623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,1,power_law_1.2,0.08675839900970458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,1,power_law_1.01,0.5280576229095459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,1,power_law_1.2,0.0945472002029419
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,1,power_law_1.01,0.5505856037139892
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,1,power_law_1.2,0.13345919847488402
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,1,power_law_1.01,0.5731135845184326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,1,power_law_1.2,0.18793599605560302
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,1,power_law_1.01,0.5911295890808106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,1,power_law_1.2,0.25102078914642334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,1,power_law_1.01,0.5976831912994385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,1,power_law_1.01,0.6082623958587646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,1,power_law_1.01,0.6239039897918701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,1,power_law_1.01,0.6441792011260986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,1,power_law_1.01,0.6728447914123535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,1,power_law_1.01,0.74617600440979
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,1,power_law_1.01,0.8198911666870117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,1,power_law_1.01,0.9603839874267578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,1,power_law_1.01,0.987820816040039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,1,power_law_1.01,1.2149567604064941
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,1,power_law_1.01,1.480172824859619
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,1,power_law_1.01,1.909619140625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,1,power_law_1.01,2.330483245849609
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,1,power_law_1.01,3.2553791046142577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,1,power_law_1.01,4.233023834228516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,1,power_law_1.01,5.1881664276123045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,1,power_law_1.01,7.986061096191406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,1,power_law_1.01,19.011392211914064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,2,power_law_1.01,0.11314560174942016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,2,power_law_1.01,0.16475520133972169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,2,power_law_1.01,0.2618304014205933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,2,power_law_1.01,0.19151359796524048
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,2,power_law_1.01,0.3623872041702271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,2,power_law_1.01,0.5395328044891358
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,2,power_law_1.01,0.5993279933929443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,2,power_law_1.01,0.7826303958892822
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,2,power_law_1.01,0.8459136009216308
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,2,power_law_1.2,0.10867840051651001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,2,power_law_1.01,0.8719231605529785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,2,power_law_1.2,0.16539520025253296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,2,power_law_1.01,0.900607967376709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,2,power_law_1.2,0.1690816044807434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,2,power_law_1.01,0.9173952102661133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,2,power_law_1.2,0.19816960096359254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,2,power_law_1.01,0.9714624404907226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,2,power_law_1.2,0.3227008104324341
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,2,power_law_1.2,0.4682432174682617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,2,power_law_1.01,1.0005375862121582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,2,power_law_1.2,0.5444928169250488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,2,power_law_1.01,1.0275584220886231
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,2,power_law_1.2,0.7392704010009765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,2,power_law_1.01,1.0576831817626953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,2,power_law_1.2,0.813804817199707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,2,power_law_1.01,1.0736448287963867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,2,power_law_1.2,0.833465576171875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,2,power_law_1.01,1.1604928016662597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,2,power_law_1.2,0.9071935653686524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,2,power_law_1.01,1.229708766937256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,2,power_law_1.2,0.9219519615173339
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,2,power_law_1.01,1.3456255912780761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,2,power_law_1.2,0.9502143859863281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,2,power_law_1.01,1.4696576118469238
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,2,power_law_1.2,0.9908608436584473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,2,power_law_1.01,1.6649087905883788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,2,power_law_1.2,1.031315231323242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,2,power_law_1.01,1.8021312713623048
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,2,power_law_1.2,1.0569087982177734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,2,power_law_1.01,2.29180793762207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,2,power_law_1.2,1.1232192039489746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,2,power_law_1.01,2.644191932678223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,2,power_law_1.2,1.167910385131836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,2,power_law_1.01,3.5461505889892577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,2,power_law_1.2,1.2539263725280763
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,2,power_law_1.01,4.821465682983399
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,2,power_law_1.2,1.411616039276123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,2,power_law_1.01,5.649695968627929
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,2,power_law_1.2,1.610086441040039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,2,power_law_1.2,1.8685056686401367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,2,power_law_1.01,8.866207885742188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,2,power_law_1.2,1.9293504714965821
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,2,power_law_1.2,2.3383487701416015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,2,power_law_1.01,18.323744201660155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,2,power_law_1.2,2.9111743927001954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,2,power_law_1.2,3.6635265350341797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,2,power_law_1.2,4.869247817993164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,2,power_law_1.2,5.952243041992188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,2,power_law_1.2,8.508966064453125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,2,power_law_1.2,18.256947326660157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,1,2,power_law_1.01,0.04559360146522522
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,1,2,power_law_1.01,0.046623998880386354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,1,2,power_law_1.01,0.06096000075340271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,1,2,power_law_1.01,0.07264000177383423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,1,2,power_law_1.01,0.07816320061683654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,1,2,power_law_1.01,0.09249920248985291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,1,2,power_law_1.01,0.0949567973613739
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,1,2,power_law_1.01,0.0957759976387024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,1,2,power_law_1.01,0.0949567973613739
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,1,2,power_law_1.01,0.09619200229644775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,1,2,power_law_1.01,0.10561920404434204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,1,2,power_law_1.01,0.12524800300598143
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,1,2,power_law_1.01,0.13224320411682128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,1,2,power_law_1.01,0.14083839654922486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,1,2,power_law_1.01,0.17011840343475343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,1,2,power_law_1.01,0.18876800537109376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,1,2,power_law_1.01,0.23948159217834472
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,1,2,power_law_1.01,0.28993279933929444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,1,2,power_law_1.01,0.3767616033554077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,1,power_law_1.01,0.09162240028381348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,1,2,power_law_1.01,0.5690752029418945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,1,2,power_law_1.01,0.7753151893615723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,1,power_law_1.01,0.11683199405670167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,1,power_law_1.2,0.45185279846191406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,1,2,power_law_1.01,1.1593088150024413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,1,power_law_1.01,0.1735551953315735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,1,power_law_1.2,0.5006656169891357
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,1,2,power_law_1.01,1.5080831527709961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,1,power_law_1.01,0.19914239645004272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,1,2,power_law_1.01,2.2259136199951173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,1,power_law_1.2,0.5059840202331543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,1,2,power_law_1.01,3.3033470153808593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,1,power_law_1.2,0.5399680137634277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,1,power_law_1.01,0.36481919288635256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,1,2,power_law_1.01,4.036531066894531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,1,power_law_1.2,0.5657792091369629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,1,power_law_1.01,0.5243648052215576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,1,power_law_1.2,0.5780799865722657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,1,2,power_law_1.01,5.542425537109375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,1,power_law_1.01,0.614470386505127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,1,power_law_1.2,0.6018303871154785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,1,2,power_law_1.01,8.061055755615234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,1,power_law_1.01,0.8166015625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,1,power_law_1.2,0.6030399799346924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,1,2,power_law_1.01,10.775283050537109
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,1,power_law_1.01,0.866585636138916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,1,power_law_1.2,0.6346047878265381
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,1,power_law_1.2,0.6524223804473877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,1,power_law_1.01,0.8612607955932617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,1,2,power_law_1.01,20.89812469482422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,1,power_law_1.2,0.6728896141052246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,1,power_law_1.01,0.91778564453125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,1,power_law_1.2,0.6794432163238525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,1,power_law_1.01,0.9640512466430664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,1,power_law_1.2,0.7511295795440673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,1,power_law_1.01,0.9820927619934082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,1,power_law_1.2,0.806828784942627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,1,power_law_1.2,0.9460927963256835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,1,power_law_1.01,1.0414848327636719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,1,power_law_1.2,1.0087679862976073
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,1,power_law_1.01,1.0543999671936035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,1,2,power_law_1.2,0.03351680040359497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,1,power_law_1.2,1.2244223594665526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,1,power_law_1.01,1.072812843322754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,1,2,power_law_1.2,0.03372159898281098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,1,power_law_1.2,1.483903980255127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,1,power_law_1.01,1.1313983917236328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,1,2,power_law_1.2,0.033542400598526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,1,power_law_1.2,1.906822395324707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,1,2,power_law_1.2,0.033523198962211606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,1,power_law_1.01,1.2354175567626953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,1,2,power_law_1.2,0.03966720104217529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,1,power_law_1.2,2.3338176727294924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,1,power_law_1.01,1.2829376220703126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,1,2,power_law_1.2,0.049907198548316954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,1,power_law_1.2,3.226764678955078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,1,2,power_law_1.2,0.047635200619697574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,1,power_law_1.01,1.4496383666992188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,1,2,power_law_1.2,0.05236480236053467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,1,power_law_1.2,4.188467025756836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,1,power_law_1.01,1.594438362121582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,1,2,power_law_1.2,0.04906879961490631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,1,power_law_1.2,5.070777511596679
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,1,2,power_law_1.2,0.04991360008716583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,1,power_law_1.01,1.8848255157470704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,1,2,power_law_1.2,0.055225598812103274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,1,power_law_1.01,2.1005056381225584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,1,power_law_1.2,7.87509765625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,1,2,power_law_1.2,0.0732479989528656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,1,2,power_law_1.2,0.07406079769134521
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,1,power_law_1.01,2.567238426208496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,1,2,power_law_1.2,0.08472959995269776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,1,power_law_1.2,18.393830871582033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,1,2,power_law_1.2,0.11298559904098511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,1,power_law_1.01,3.115500831604004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,1,2,power_law_1.2,0.12485760450363159
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,1,2,power_law_1.2,0.14575999975204468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,1,power_law_1.01,4.117574310302734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,1,2,power_law_1.2,0.20718719959259033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,1,2,power_law_1.2,0.26781439781188965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,1,power_law_1.01,5.433004760742188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,1,2,power_law_1.2,0.38985600471496584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,1,2,power_law_1.2,0.49863038063049314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,1,power_law_1.01,6.524806213378906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,1,2,power_law_1.2,0.7420608043670655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,1,2,power_law_1.2,0.9706879615783691
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,1,power_law_1.01,10.155699157714844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,1,2,power_law_1.2,1.4435456275939942
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,1,2,power_law_1.2,1.9059904098510743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,1,2,power_law_1.01,0.0720192015171051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,1,2,power_law_1.2,2.851353645324707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,1,power_law_1.01,19.978720092773436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,1,2,power_law_1.01,0.084307199716568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,1,2,power_law_1.2,3.7897407531738283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,1,2,power_law_1.01,0.09127680063247681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,1,2,power_law_1.2,4.730598449707031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,1,2,power_law_1.01,0.10724480152130127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,1,2,power_law_1.01,0.11011199951171875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,1,2,power_law_1.2,7.530802917480469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,1,2,power_law_1.01,0.11092480421066284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,1,2,power_law_1.01,0.11175680160522461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,1,2,power_law_1.2,15.04943389892578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,1,2,power_law_1.01,0.1121664047241211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,1,2,power_law_1.01,0.11413760185241699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,1,2,power_law_1.01,0.1215872049331665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,1,2,power_law_1.01,0.12362879514694214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,1,2,power_law_1.01,0.1264256000518799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,1,2,power_law_1.01,0.13017599582672118
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,1,2,power_law_1.2,0.0742143988609314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,1,2,power_law_1.01,0.13755520582199096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,1,2,power_law_1.2,0.07871999740600585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,1,2,power_law_1.01,0.1418496012687683
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,1,2,power_law_1.2,0.0883520007133484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,1,2,power_law_1.01,0.14965759515762328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,2,1,power_law_1.01,0.03392640054225922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,1,2,power_law_1.2,0.11148799657821655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,1,2,power_law_1.01,0.187718403339386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,2,1,power_law_1.01,0.03782399892807007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,1,2,power_law_1.2,0.11005439758300781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,1,2,power_law_1.01,0.2061568021774292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,2,1,power_law_1.01,0.04211199879646301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,1,2,power_law_1.2,0.11210240125656128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,1,2,power_law_1.01,0.23237760066986085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,2,1,power_law_1.01,0.05010560154914856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,1,2,power_law_1.2,0.11230720281600952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,1,2,power_law_1.01,0.3145024061203003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,2,1,power_law_1.01,0.05398399829864502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,1,2,power_law_1.2,0.11230720281600952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,1,2,power_law_1.01,0.38045439720153806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,2,1,power_law_1.01,0.05973119735717773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,1,2,power_law_1.2,0.11269760131835938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,1,2,power_law_1.01,0.4953152179718018
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,2,1,power_law_1.01,0.05829120278358459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,1,2,power_law_1.2,0.11967999935150146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,1,2,power_law_1.01,0.6149312019348144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,2,1,power_law_1.01,0.061587202548980716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,1,2,power_law_1.2,0.1251520037651062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,1,2,power_law_1.01,0.8600768089294434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,2,1,power_law_1.01,0.060550397634506224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,1,2,power_law_1.2,0.12906880378723146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,2,1,power_law_1.01,0.0642304003238678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,1,2,power_law_1.01,1.2952639579772949
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,1,power_law_1.2,0.09000319838523865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,1,2,power_law_1.2,0.12949119806289672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,2,1,power_law_1.01,0.06996480226516724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,1,2,power_law_1.01,2.032153511047363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,1,power_law_1.2,0.11744639873504639
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,1,2,power_law_1.2,0.13647359609603882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,2,1,power_law_1.01,0.0859391987323761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,1,2,power_law_1.01,2.3098623275756838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,1,2,power_law_1.2,0.14506880044937134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,1,power_law_1.2,0.14161280393600464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,2,1,power_law_1.01,0.08655359745025634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,1,2,power_law_1.01,2.9877567291259766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,1,2,power_law_1.2,0.14958720207214354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,2,1,power_law_1.01,0.09127680063247681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,1,power_law_1.2,0.2048959970474243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,1,2,power_law_1.2,0.18645119667053223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,1,2,power_law_1.01,5.717113494873047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,2,1,power_law_1.01,0.1162559986114502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,1,2,power_law_1.2,0.2120448112487793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,1,power_law_1.2,0.32016639709472655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,2,1,power_law_1.01,0.12711679935455322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,1,2,power_law_1.01,11.851699066162109
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,1,2,power_law_1.2,0.24992640018463136
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,2,1,power_law_1.01,0.15557760000228882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,1,power_law_1.2,0.44121599197387695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,1,2,power_law_1.2,0.30789120197296144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,2,1,power_law_1.01,0.21311359405517577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,1,power_law_1.2,0.5649216175079346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,1,2,power_law_1.2,0.35641601085662844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,2,1,power_law_1.01,0.2755903959274292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,1,2,power_law_1.2,0.5911359786987305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,2,1,power_law_1.01,0.387827205657959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,1,power_law_1.2,0.766649580001831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,1,2,power_law_1.2,0.6275904178619385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,2,1,power_law_1.01,0.49695358276367185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,1,power_law_1.2,0.8112895965576172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,2,1,power_law_1.01,0.7298367977142334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,1,2,power_law_1.2,0.9546496391296386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,2,1,power_law_1.01,0.9583935737609863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,1,2,power_law_1.2,1.1711296081542968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,1,power_law_1.2,0.8469440460205078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,2,1,power_law_1.01,1.4218560218811036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,2,1,power_law_1.2,0.031462401151657104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,1,2,power_law_1.2,1.9383039474487305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,1,power_law_1.2,0.9001728057861328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,2,1,power_law_1.2,0.030649599432945252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,2,1,power_law_1.01,1.8799808502197266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,1,2,power_law_1.2,2.834899139404297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,1,power_law_1.2,0.9292672157287598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,2,1,power_law_1.2,0.0316864013671875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,2,1,power_law_1.01,2.790323257446289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,1,2,power_law_1.2,3.1615680694580077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,2,1,power_law_1.2,0.03269760012626648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,1,power_law_1.2,0.9673727989196778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,2,1,power_law_1.01,3.7020801544189452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,1,2,power_law_1.2,5.553855895996094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,2,1,power_law_1.2,0.036185601353645326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,2,1,power_law_1.01,4.611827087402344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,1,power_law_1.2,1.0328767776489258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,2,1,power_law_1.2,0.04991360008716583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,1,2,power_law_1.2,9.435820770263671
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,2,1,power_law_1.2,0.04947839975357056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,2,1,power_law_1.01,7.386239624023437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,1,power_law_1.2,1.0568448066711427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,2,1,power_law_1.2,0.05338240265846252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,1,power_law_1.2,1.0838848114013673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,2,1,power_law_1.2,0.05235840082168579
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,2,1,power_law_1.01,14.72423095703125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,2,1,power_law_1.2,0.05235840082168579
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,1,power_law_1.2,1.1350784301757812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,2,1,power_law_1.2,0.05686399936676025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,2,1,power_law_1.2,0.07608960270881653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,1,power_law_1.2,1.2772159576416016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,2,1,power_law_1.2,0.07631360292434693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,1,power_law_1.2,1.3492992401123047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,2,1,power_law_1.2,0.08286719918251037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,2,1,power_law_1.2,0.1047808051109314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,1,power_law_1.2,1.5489791870117187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,2,1,power_law_1.2,0.11297919750213622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,1,power_law_1.2,1.6321344375610352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,2,1,power_law_1.2,0.14205440282821655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,2,1,power_law_1.01,0.05803520083427429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,2,1,power_law_1.2,0.20062720775604248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,1,power_law_1.2,1.9862335205078125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,2,1,power_law_1.01,0.07052159905433655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,2,1,power_law_1.2,0.2571455955505371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,2,1,power_law_1.01,0.07278720140457154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,1,power_law_1.2,2.139423942565918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,2,1,power_law_1.2,0.37776000499725343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,2,1,power_law_1.2,0.05687680244445801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,2,1,power_law_1.01,0.10617599487304688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,2,1,power_law_1.2,0.06607360243797303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,2,1,power_law_1.2,0.48919038772583007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,1,power_law_1.2,2.604934310913086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,2,1,power_law_1.01,0.10533119440078735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,2,1,power_law_1.2,0.0775488018989563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,2,1,power_law_1.2,0.7203968048095704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,2,1,power_law_1.01,0.10759040117263793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,2,1,power_law_1.2,0.10437120199203491
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,2,1,power_law_1.2,0.9440447807312011
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,1,power_law_1.2,3.7434112548828127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,2,1,power_law_1.01,0.1082111954689026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,2,1,power_law_1.2,0.10437120199203491
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,2,1,power_law_1.2,1.4107839584350585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,2,1,power_law_1.01,0.10944639444351197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,1,power_law_1.2,4.678124618530274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,2,1,power_law_1.2,0.10684159994125367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,2,1,power_law_1.2,1.8660543441772461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,2,1,power_law_1.01,0.10841599702835084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,2,1,power_law_1.2,0.10806399583816528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,2,1,power_law_1.2,2.7813119888305664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,1,power_law_1.2,5.364614486694336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,2,1,power_law_1.01,0.11191040277481079
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,2,1,power_law_1.2,0.10869120359420777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,2,1,power_law_1.2,3.6848896026611326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,2,1,power_law_1.01,0.11313920021057129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,2,1,power_law_1.2,0.10887680053710938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,1,power_law_1.2,6.4664451599121096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,2,1,power_law_1.01,0.11845760345458985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,2,1,power_law_1.2,4.607308959960937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,2,1,power_law_1.2,0.110534405708313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,2,1,power_law_1.01,0.12213759422302246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,2,1,power_law_1.2,0.11360000371932984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,2,1,power_law_1.2,7.366169738769531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,1,power_law_1.2,10.260761260986328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,2,1,power_law_1.01,0.12522239685058595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,2,1,power_law_1.2,0.11809920072555542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,2,1,power_law_1.01,0.13812479972839356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,2,1,power_law_1.2,14.631443786621094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,2,1,power_law_1.2,0.12240639925003052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,2,1,power_law_1.01,0.14506239891052247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,2,1,power_law_1.2,0.1258944034576416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,1,power_law_1.2,19.50257263183594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,2,1,power_law_1.01,0.15489280223846436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,2,1,power_law_1.2,0.1418496012687683
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,2,1,power_law_1.01,0.18183679580688478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,2,1,power_law_1.2,0.14492160081863403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,2,1,power_law_1.01,0.21349120140075684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,2,1,power_law_1.2,0.1576192021369934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,2,1,power_law_1.01,0.2607935905456543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,2,1,power_law_1.2,0.1879040002822876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,2,1,power_law_1.01,0.3201792001724243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,2,1,power_law_1.2,0.21191039085388183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,2,1,power_law_1.01,0.4207359790802002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,2,1,power_law_1.2,0.26370561122894287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,2,1,power_law_1.2,0.3179903984069824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,2,1,power_law_1.01,0.5087999820709228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,2,1,power_law_1.2,0.4203904151916504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,2,1,power_law_1.01,0.7084735870361328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,2,1,power_law_1.2,0.5154176235198975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,2,1,power_law_1.01,0.9104127883911133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,2,1,power_law_1.2,0.7212351799011231
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,2,1,power_law_1.01,1.312019157409668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,2,1,power_law_1.2,0.9223615646362304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,2,1,power_law_1.01,1.7226367950439454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,2,1,power_law_1.2,1.3325568199157716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,2,1,power_law_1.01,2.158252716064453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,2,1,power_law_1.2,1.752191925048828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,2,1,power_law_1.01,3.4974464416503905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,2,1,power_law_1.2,2.2037824630737304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,2,1,power_law_1.01,7.404621124267578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,1,2,power_law_1.01,0.06812160015106201
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,2,1,power_law_1.2,3.520435333251953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,1,2,power_law_1.01,0.06915199756622314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,1,2,power_law_1.2,0.0676800012588501
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,2,1,power_law_1.2,7.443583679199219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,1,2,power_law_1.01,0.07343999743461609
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,1,2,power_law_1.2,0.07300480008125305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,1,2,power_law_1.01,0.10172159671783447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,1,2,power_law_1.2,0.09347839951515198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,1,2,power_law_1.01,0.1369279980659485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,1,2,power_law_1.2,0.11232000589370728
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,1,2,power_law_1.01,0.1791167974472046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,1,2,power_law_1.2,0.1280959963798523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,1,2,power_law_1.01,0.14615039825439452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,1,2,power_law_1.2,0.16106879711151123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,1,2,power_law_1.01,0.19591679573059081
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,1,2,power_law_1.2,0.15123840570449829
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,1,2,power_law_1.01,0.15230720043182372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,1,2,power_law_1.2,0.16473599672317504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,1,2,power_law_1.01,0.17829760313034057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,1,2,power_law_1.2,0.14978560209274291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,1,2,power_law_1.01,0.2018496036529541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,1,2,power_law_1.2,0.15286400318145751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,1,2,power_law_1.01,0.21456000804901124
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,1,2,power_law_1.2,0.16754560470581054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,1,2,power_law_1.01,0.20554239749908448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,1,2,power_law_1.2,0.18688640594482422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,1,2,power_law_1.2,0.187283194065094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,1,2,power_law_1.2,0.22824320793151856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,1,2,power_law_1.01,0.1172287940979004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,1,2,power_law_1.2,0.2808768033981323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,1,2,power_law_1.01,0.11210880279541016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,1,2,power_law_1.2,0.27124478816986086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,1,2,power_law_1.01,0.13114880323410033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,1,2,power_law_1.2,0.1004863977432251
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,1,2,power_law_1.2,0.39904639720916746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,1,2,power_law_1.2,0.09864320158958435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,1,2,power_law_1.01,0.15818239450454713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,1,2,power_law_1.2,0.48546562194824217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,1,2,power_law_1.2,0.12036479711532592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,1,2,power_law_1.01,0.15942399501800536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,1,2,power_law_1.2,0.6355904102325439
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,1,2,power_law_1.2,0.1574336051940918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,1,2,power_law_1.01,0.16104960441589355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,1,2,power_law_1.2,1.046003246307373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,1,2,power_law_1.2,0.15781760215759277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,1,2,power_law_1.01,0.16145919561386107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,1,2,power_law_1.2,1.3308927536010742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,1,2,power_law_1.2,0.1598847985267639
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,1,2,power_law_1.01,0.16222720146179198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,1,2,power_law_1.2,2.031711959838867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,1,2,power_law_1.2,0.1600767970085144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,1,2,power_law_1.01,0.16433919668197633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,1,2,power_law_1.2,0.16131839752197266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,1,2,power_law_1.2,2.3821056365966795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,1,2,power_law_1.01,0.16617599725723267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,1,2,power_law_1.2,0.163372802734375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,1,2,power_law_1.01,0.1672063946723938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,1,2,power_law_1.2,3.443795013427734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,1,2,power_law_1.2,0.16417920589447021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,1,2,power_law_1.01,0.17189760208129884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,1,2,power_law_1.2,4.917132949829101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,1,2,power_law_1.2,0.1670591950416565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,1,2,power_law_1.01,0.1739583969116211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,1,2,power_law_1.2,7.749504089355469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,1,2,power_law_1.2,0.17278720140457154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,1,2,power_law_1.01,0.18481279611587526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,1,2,power_law_1.2,0.1832319974899292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,1,2,power_law_1.01,0.20816640853881835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,1,2,power_law_1.2,9.107328033447265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,1,2,power_law_1.2,0.20105600357055664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,1,2,power_law_1.01,0.22782719135284424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,1,2,power_law_1.2,0.20904319286346434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,1,2,power_law_1.2,13.110150146484376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,1,2,power_law_1.01,0.23600640296936035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,1,2,power_law_1.2,0.2444607973098755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,1,2,power_law_1.01,0.28721280097961427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,1,2,power_law_1.2,0.23607680797576905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,1,2,power_law_1.2,19.26622772216797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,1,2,power_law_1.01,0.3347264051437378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,1,2,power_law_1.2,0.2956608057022095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,1,2,power_law_1.01,0.4139840126037598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,1,2,power_law_1.2,0.35341439247131345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,1,2,power_law_1.01,0.534611177444458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,1,2,power_law_1.2,0.44905600547790525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,1,2,power_law_1.2,41.837643432617185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,1,2,power_law_1.01,0.7039680004119873
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,1,2,power_law_1.2,0.5739903926849366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,1,2,power_law_1.01,0.9337599754333497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,1,2,power_law_1.2,0.6896959781646729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,1,2,power_law_1.01,1.2944064140319824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,1,2,power_law_1.2,0.9354623794555664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,1,2,power_law_1.01,1.5940287590026856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,1,2,power_law_1.2,1.3878399848937988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,1,2,power_law_1.01,2.809107208251953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,1,2,power_law_1.2,2.1077375411987305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,1,2,power_law_1.01,3.542496109008789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,1,2,power_law_1.2,2.71964168548584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,1,2,power_law_1.2,3.6967681884765624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,1,2,power_law_1.01,4.713337707519531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,1,2,power_law_1.2,5.195232009887695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,1,2,power_law_1.01,7.963053131103516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,1,2,power_law_1.2,7.657804870605469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,2,1,power_law_1.01,0.04596480131149292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,1,2,power_law_1.01,15.617312622070312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,2,1,power_law_1.01,0.0529151976108551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,2,1,power_law_1.01,0.08302720189094544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,1,2,power_law_1.2,19.040800476074217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,2,1,power_law_1.01,0.12008960247039795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,2,1,power_law_1.01,0.11805440187454223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,2,1,power_law_1.01,0.12502399682998658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,2,1,power_law_1.01,0.1295232057571411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,2,1,power_law_1.01,0.13485440015792846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,2,1,power_law_1.01,0.13320959806442262
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,2,1,power_law_1.01,0.13485440015792846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,2,1,power_law_1.01,0.13854080438613892
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,2,1,power_law_1.01,0.16802560091018676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,2,1,power_law_1.01,0.17744640111923218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,2,1,power_law_1.01,0.1987328052520752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,2,1,power_law_1.2,0.04472959935665131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,2,1,power_law_1.01,0.21349759101867677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,2,1,power_law_1.2,0.063372802734375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,2,1,power_law_1.01,0.23601920604705812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,2,1,power_law_1.2,0.08015999794006348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,2,1,power_law_1.01,0.2857919931411743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,2,1,power_law_1.2,0.11559679508209228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,2,1,power_law_1.01,0.3812096118927002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,2,1,power_law_1.2,0.11477119922637939
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,2,1,power_law_1.01,0.47481598854064944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,2,1,power_law_1.2,0.12541439533233642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,2,1,power_law_1.01,0.07079039812088013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,2,1,power_law_1.01,0.668339204788208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,2,1,power_law_1.2,0.13031680583953859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,2,1,power_law_1.01,0.09822720289230347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,2,1,power_law_1.01,0.8547136306762695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,2,1,power_law_1.2,0.13320319652557372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,2,1,power_law_1.01,0.10111360549926758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,2,1,power_law_1.01,1.2317440032958984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,2,1,power_law_1.2,0.13217920064926147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,2,1,power_law_1.01,0.146943998336792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,2,1,power_law_1.01,1.6087936401367187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,2,1,power_law_1.2,0.1348479986190796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,2,1,power_law_1.01,0.150873601436615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,2,1,power_law_1.01,2.3772096633911133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,2,1,power_law_1.2,0.13852159976959227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,2,1,power_law_1.01,0.14819200038909913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,2,1,power_law_1.01,3.1589183807373047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,2,1,power_law_1.2,0.16575360298156738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,2,1,power_law_1.01,0.15148799419403075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,2,1,power_law_1.01,4.617907333374023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,2,1,power_law_1.2,0.17455999851226806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,2,1,power_law_1.01,0.15230720043182372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,2,1,power_law_1.2,0.19258879423141478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,2,1,power_law_1.01,0.15270400047302246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,2,1,power_law_1.01,6.165375900268555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,2,1,power_law_1.2,0.21717119216918945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,2,1,power_law_1.01,0.15352959632873536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,2,1,power_law_1.01,7.679462432861328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,2,1,power_law_1.01,0.16416640281677247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,2,1,power_law_1.2,0.2392575979232788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,2,1,power_law_1.01,0.16785279512405396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,2,1,power_law_1.2,0.2790271997451782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,2,1,power_law_1.01,12.231558227539063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,2,1,power_law_1.01,0.17237759828567506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,2,1,power_law_1.2,0.36871678829193116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,2,1,power_law_1.01,0.1711359977722168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,2,1,power_law_1.2,0.4735743999481201
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,2,1,power_law_1.01,24.297337341308594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,2,1,power_law_1.01,0.19552639722824097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,2,1,power_law_1.2,0.6556479930877686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,2,1,power_law_1.01,0.20207359790802001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,2,1,power_law_1.2,0.8399552345275879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,2,1,power_law_1.01,0.21619839668273927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,2,1,power_law_1.2,1.2255999565124511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,2,1,power_law_1.01,0.2563456058502197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,2,1,power_law_1.2,1.6136896133422851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,2,1,power_law_1.01,0.30303359031677246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,2,1,power_law_1.2,2.366143989562988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,2,1,power_law_1.01,0.37102720737457273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,2,1,power_law_1.2,3.123276710510254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,2,1,power_law_1.01,0.4429056167602539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,2,1,power_law_1.01,0.578495979309082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,2,1,power_law_1.2,4.6371711730957035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,2,1,power_law_1.01,0.7171328067779541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,2,1,power_law_1.2,6.178476715087891
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,2,1,power_law_1.01,0.996070384979248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,2,1,power_law_1.2,7.681094360351563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,2,1,power_law_1.01,1.2759615898132324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,2,1,power_law_1.01,1.8558336257934571
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,2,1,power_law_1.2,12.233184051513671
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,2,1,power_law_1.01,2.4812799453735352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,2,1,power_law_1.01,3.050828742980957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,2,1,power_law_1.2,24.259642028808592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,2,1,power_law_1.2,0.07218559980392455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,2,1,power_law_1.01,5.056857681274414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,2,1,power_law_1.2,0.08446080088615418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,2,1,power_law_1.2,0.09675520062446594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,2,1,power_law_1.01,11.004441833496093
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,2,1,power_law_1.2,0.1495296001434326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,2,1,power_law_1.2,0.14958720207214354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,2,1,power_law_1.2,0.1519871950149536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,2,1,power_law_1.2,0.1527999997138977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,2,1,power_law_1.2,0.15367679595947265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,2,1,power_law_1.2,0.15574400424957274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,2,1,power_law_1.2,0.1590208053588867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,2,1,power_law_1.2,0.16270079612731933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,2,1,power_law_1.2,0.1659775972366333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,2,1,power_law_1.2,0.16966400146484376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,2,1,power_law_1.2,0.17662080526351928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,2,1,power_law_1.2,0.19874559640884398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,1,2,power_law_1.01,0.05189759731292724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,2,1,power_law_1.2,0.2024319887161255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,2,1,power_law_1.2,0.21656320095062256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,1,2,power_law_1.01,0.053529602289199826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,2,1,power_law_1.2,0.2587519884109497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,1,2,power_law_1.2,0.05236480236053467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,1,2,power_law_1.01,0.057017600536346434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,2,1,power_law_1.2,0.29909119606018064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,1,2,power_law_1.2,0.05359359979629517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,2,1,power_law_1.2,0.3705663919448853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,1,2,power_law_1.01,0.07012479901313781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,2,1,power_law_1.2,0.4477695941925049
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,1,2,power_law_1.2,0.0574720025062561
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,1,2,power_law_1.01,0.1102720022201538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,2,1,power_law_1.2,0.5853888034820557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,1,2,power_law_1.2,0.07121279835700989
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,1,2,power_law_1.01,0.11129599809646606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,2,1,power_law_1.2,0.7158592224121094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,1,2,power_law_1.2,0.1107200026512146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,2,1,power_law_1.2,0.9955519676208496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,1,2,power_law_1.01,0.11190400123596192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,2,1,power_law_1.2,1.2878591537475585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,1,2,power_law_1.2,0.11215360164642334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,1,2,power_law_1.01,0.13238400220870972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,2,1,power_law_1.2,1.8721536636352538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,1,2,power_law_1.2,0.11418880224227905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,1,2,power_law_1.01,0.15694719552993774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,2,1,power_law_1.2,2.46364803314209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,1,2,power_law_1.2,0.13633279800415038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,1,2,power_law_1.01,0.17662080526351928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,2,1,power_law_1.2,3.0700351715087892
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,1,2,power_law_1.2,0.16110719442367555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,1,2,power_law_1.01,0.22311038970947267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,2,1,power_law_1.2,5.095296096801758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,1,2,power_law_1.2,0.18343679904937743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,1,2,power_law_1.01,0.2691967964172363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,2,1,power_law_1.2,11.017913818359375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,1,2,power_law_1.2,0.2297152042388916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,1,2,power_law_1.01,0.3164992094039917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,1,2,power_law_1.2,0.2715008020401001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,1,2,power_law_1.01,0.40026240348815917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,1,2,power_law_1.2,0.321670389175415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,1,2,power_law_1.01,0.2863935947418213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,1,2,power_law_1.2,0.41034879684448244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,1,2,power_law_1.01,0.33717761039733884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,1,2,power_law_1.2,0.2950527906417847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,1,2,power_law_1.2,0.3425407886505127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,1,2,power_law_1.01,0.43076481819152834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,1,2,power_law_1.2,0.44572157859802247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,1,2,power_law_1.01,0.35192959308624266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,1,2,power_law_1.2,0.3554752111434937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,1,2,power_law_1.01,0.4436863899230957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,1,2,power_law_1.2,0.45807361602783203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,1,2,power_law_1.01,0.6884223937988281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,1,2,power_law_1.2,0.6921664237976074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,1,2,power_law_1.01,0.9042816162109375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,1,2,power_law_1.2,0.9333888053894043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,1,2,power_law_1.01,1.300979232788086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,1,2,power_law_1.01,0.11314560174942016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,1,2,power_law_1.2,1.3559103965759278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,1,2,power_law_1.01,1.737798309326172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,1,2,power_law_1.01,0.14631680250167847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,1,2,power_law_1.2,1.7788223266601562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,1,2,power_law_1.01,2.6036863327026367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,1,2,power_law_1.01,0.1411903977394104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,1,2,power_law_1.2,2.723763275146484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,1,2,power_law_1.01,3.487200164794922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,1,2,power_law_1.01,0.17128959894180298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,1,2,power_law_1.2,3.4553150177001952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,1,2,power_law_1.01,0.2628544092178345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,1,2,power_law_1.01,5.096934509277344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,1,2,power_law_1.2,5.348684692382813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,1,2,power_law_1.01,0.3238976001739502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,1,2,power_law_1.01,6.980883026123047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,1,2,power_law_1.01,0.4236032009124756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,1,2,power_law_1.2,7.0984962463378904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,1,2,power_law_1.01,8.681132507324218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,1,2,power_law_1.01,0.4600639820098877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,1,2,power_law_1.2,9.021158599853516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,1,2,power_law_1.01,0.47480320930480957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,1,2,power_law_1.01,13.759353637695312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,1,2,power_law_1.01,0.48129920959472655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,1,2,power_law_1.01,0.25374081134796145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,1,2,power_law_1.2,14.072550964355468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,1,2,power_law_1.01,0.2919680118560791
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,1,2,power_law_1.01,0.50348801612854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,1,2,power_law_1.01,0.31571838855743406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,1,2,power_law_1.01,27.355621337890625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,1,2,power_law_1.01,0.5263936042785644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,1,2,power_law_1.01,0.42427520751953124
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,1,2,power_law_1.2,28.367608642578126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,1,2,power_law_1.01,0.5214975833892822
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,1,2,power_law_1.01,0.6042816162109375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,1,2,power_law_1.01,0.7470272064208985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,1,2,power_law_1.01,0.5509888172149658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,1,2,power_law_1.01,1.081881618499756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,1,2,power_law_1.01,0.5620543956756592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,1,2,power_law_1.01,1.4308544158935548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,1,2,power_law_1.01,0.5821119785308838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,1,2,power_law_1.01,2.287334442138672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,1,2,power_law_1.01,0.6025983810424804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,1,2,power_law_1.01,2.9427007675170898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,1,2,power_law_1.01,0.657696008682251
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,1,2,power_law_1.01,4.516787338256836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,1,2,power_law_1.01,0.7088960170745849
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,1,2,power_law_1.01,5.953446578979492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,2,1,power_law_1.01,0.031065601110458373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,1,2,power_law_1.01,0.8403136253356933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,1,2,power_law_1.01,8.300479888916016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,2,1,power_law_1.01,0.03269760012626648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,1,2,power_law_1.01,0.8657855987548828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,1,2,power_law_1.01,12.156237030029297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,2,1,power_law_1.01,0.03885439932346344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,1,2,power_law_1.01,1.0328831672668457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,1,2,power_law_1.01,14.535186767578125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,1,2,power_law_1.2,0.11210240125656128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,2,1,power_law_1.01,0.0546176016330719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,1,2,power_law_1.01,1.24650239944458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,1,2,power_law_1.2,0.13975679874420166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,2,1,power_law_1.01,0.12485120296478272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,1,2,power_law_1.01,1.58787841796875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,1,2,power_law_1.01,21.551231384277344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,1,2,power_law_1.2,0.11763839721679688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,2,1,power_law_1.01,0.096806401014328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,1,2,power_law_1.01,1.8512704849243165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,1,2,power_law_1.2,0.16513919830322266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,2,1,power_law_1.01,0.11419520378112794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,1,2,power_law_1.01,2.493516731262207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,1,2,power_law_1.01,46.53480224609375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,2,1,power_law_1.01,0.13180160522460938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,1,2,power_law_1.2,0.2292543888092041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,1,2,power_law_1.01,2.9942527770996095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,2,1,power_law_1.01,0.12220159769058228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,1,2,power_law_1.2,0.28517119884490966
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,1,2,power_law_1.01,3.676639938354492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,2,1,power_law_1.01,0.13467520475387573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,1,2,power_law_1.2,0.43752322196960447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,2,1,power_law_1.01,0.16090879440307618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,1,2,power_law_1.2,0.4506368160247803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,1,2,power_law_1.01,5.431788635253906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,2,1,power_law_1.01,0.18528640270233154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,1,2,power_law_1.2,0.45145602226257325
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,2,1,power_law_1.01,0.20924160480499268
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,1,2,power_law_1.01,10.774816131591797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,1,2,power_law_1.2,0.4719359874725342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,2,1,power_law_1.01,0.25961599349975584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,1,2,power_law_1.2,0.5001984119415284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,2,1,power_law_1.2,0.030847999453544616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,2,1,power_law_1.01,0.2006335973739624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,1,2,power_law_1.2,0.5325568199157715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,2,1,power_law_1.2,0.05358080267906189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,2,1,power_law_1.01,0.22767360210418702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,1,2,power_law_1.2,0.5440063953399659
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,2,1,power_law_1.2,0.06096000075340271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,2,1,power_law_1.01,0.28071041107177735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,1,2,power_law_1.2,0.5497600078582764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,2,1,power_law_1.2,0.10274560451507568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,2,1,power_law_1.01,0.23912320137023926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,1,2,power_law_1.2,0.5780159950256347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,2,1,power_law_1.2,0.20718719959259033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,2,1,power_law_1.01,0.2958656072616577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,1,2,power_law_1.2,0.588262414932251
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,2,1,power_law_1.2,0.19203840494155883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,2,1,power_law_1.01,0.4234623908996582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,1,2,power_law_1.2,0.6247231960296631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,2,1,power_law_1.2,0.26451199054718016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,2,1,power_law_1.01,0.5375296115875244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,1,2,power_law_1.2,0.6929215908050537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,2,1,power_law_1.2,0.3145087957382202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,2,1,power_law_1.01,0.7703807830810547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,1,2,power_law_1.2,0.756825590133667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,2,1,power_law_1.2,0.2964735984802246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,2,1,power_law_1.01,1.0022336006164552
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,1,2,power_law_1.2,0.8870783805847168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,2,1,power_law_1.2,0.32186241149902345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,2,1,power_law_1.01,1.472640037536621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,1,2,power_law_1.2,0.8841983795166015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,2,1,power_law_1.2,0.3417344093322754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,2,1,power_law_1.01,1.9502336502075195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,1,2,power_law_1.2,1.1301759719848632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,2,1,power_law_1.01,0.10412160158157349
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,2,1,power_law_1.2,0.38124799728393555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,2,1,power_law_1.01,2.8914880752563477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,1,2,power_law_1.2,1.298515224456787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,2,1,power_law_1.01,0.13178240060806273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,2,1,power_law_1.2,0.38881280422210696
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,2,1,power_law_1.01,3.8487167358398438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,1,2,power_law_1.2,1.6276159286499023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,2,1,power_law_1.01,0.14058239459991456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,2,1,power_law_1.2,0.44004478454589846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,2,1,power_law_1.01,0.22271358966827393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,2,1,power_law_1.2,0.39273600578308104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,1,2,power_law_1.2,1.9665599822998048
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,2,1,power_law_1.01,4.789977645874023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,2,1,power_law_1.01,0.3031872034072876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,2,1,power_law_1.2,0.4322495937347412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,1,2,power_law_1.2,2.6651391983032227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,2,1,power_law_1.01,7.633638763427735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,2,1,power_law_1.01,0.38430080413818357
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,2,1,power_law_1.2,0.48181757926940916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,1,2,power_law_1.2,3.0941888809204103
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,2,1,power_law_1.01,0.5206783771514892
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,2,1,power_law_1.2,0.4756800174713135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,2,1,power_law_1.01,15.208370971679688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,1,2,power_law_1.2,3.938380813598633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,2,1,power_law_1.01,0.5632832050323486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,2,1,power_law_1.2,0.5338304042816162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,2,1,power_law_1.01,0.5891007900238037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,2,1,power_law_1.2,0.7417088031768799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,1,2,power_law_1.2,6.011577606201172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,2,1,power_law_1.01,0.5899007797241211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,2,1,power_law_1.2,0.8105088233947754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,1,2,power_law_1.2,11.122150421142578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,2,1,power_law_1.01,0.6169343948364258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,2,1,power_law_1.2,1.0613951683044434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,2,1,power_law_1.01,0.6408895969390869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,2,1,power_law_1.2,1.3145343780517578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,2,1,power_law_1.01,0.6523712158203125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,2,1,power_law_1.2,1.753011131286621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,2,1,power_law_1.01,0.6745024204254151
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,2,1,power_law_1.2,2.2488256454467774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,2,1,power_law_1.01,0.6888063907623291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,2,1,power_law_1.2,3.2042304992675783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,1,2,power_law_1.01,0.027116799354553224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,2,1,power_law_1.01,0.708076810836792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,2,1,power_law_1.2,4.127072143554687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,1,2,power_law_1.01,0.03079040050506592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,2,1,power_law_1.01,0.7604864120483399
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,1,2,power_law_1.01,0.04186240136623383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,2,1,power_law_1.01,0.8487872123718262
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,2,1,power_law_1.2,5.130547332763672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,1,2,power_law_1.01,0.06193280220031738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,2,1,power_law_1.01,0.9149248123168945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,2,1,power_law_1.2,7.9140159606933596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,1,2,power_law_1.01,0.07646080255508422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,2,1,power_law_1.01,1.060915184020996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,1,2,power_law_1.01,0.10781439542770385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,2,1,power_law_1.2,0.10027519464492798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,2,1,power_law_1.01,1.0859456062316895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,1,2,power_law_1.01,0.12091519832611083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,2,1,power_law_1.2,0.12772480249404908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,2,1,power_law_1.2,15.439590454101562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,2,1,power_law_1.01,1.3161215782165527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,1,2,power_law_1.01,0.1090432047843933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,2,1,power_law_1.2,0.14266239404678344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,1,2,power_law_1.01,0.11498240232467652
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,2,1,power_law_1.01,1.5780672073364257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,2,1,power_law_1.2,0.20760319232940674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,1,2,power_law_1.01,0.12172800302505493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,2,1,power_law_1.2,0.2684351921081543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,2,1,power_law_1.01,1.975174331665039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,1,2,power_law_1.01,0.13401600122451782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,2,1,power_law_1.2,0.34932479858398435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,2,1,power_law_1.01,2.398489570617676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,1,2,power_law_1.01,0.1270591974258423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,1,2,power_law_1.2,0.02900480031967163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,2,1,power_law_1.2,0.5330239772796631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,2,1,power_law_1.01,3.225881576538086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,1,2,power_law_1.01,0.13215359449386596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,1,2,power_law_1.2,0.03351039886474609
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,2,1,power_law_1.2,0.541209602355957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,1,2,power_law_1.01,0.14222079515457153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,1,2,power_law_1.2,0.04335359930992126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,2,1,power_law_1.01,4.045491027832031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,2,1,power_law_1.2,0.5854400157928467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,1,2,power_law_1.01,0.13194880485534669
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,1,2,power_law_1.2,0.05604479908943176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,2,1,power_law_1.01,4.889657592773437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,2,1,power_law_1.2,0.6067455768585205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,1,2,power_law_1.2,0.07201279997825623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,1,2,power_law_1.01,0.14160640239715577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,2,1,power_law_1.2,0.6227200031280518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,1,2,power_law_1.2,0.11093120574951172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,1,2,power_law_1.01,0.15777920484542846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,2,1,power_law_1.01,7.333350372314453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,2,1,power_law_1.2,0.6487360000610352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,1,2,power_law_1.2,0.12035839557647705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,1,2,power_law_1.01,0.21164159774780272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,1,2,power_law_1.2,0.10909440517425537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,2,1,power_law_1.2,0.6614336013793946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,1,2,power_law_1.01,0.24870400428771972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,2,1,power_law_1.01,14.582246398925781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,1,2,power_law_1.2,0.11747839450836181
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,1,2,power_law_1.01,0.32039680480957033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,2,1,power_law_1.2,0.6651135921478272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,1,2,power_law_1.2,0.12506239414215087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,1,2,power_law_1.01,0.39964799880981444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,2,1,power_law_1.2,0.7167359828948975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,1,2,power_law_1.2,0.1395967960357666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,1,2,power_law_1.01,0.5321536064147949
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,2,1,power_law_1.2,0.7474495887756347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,1,2,power_law_1.2,0.1264896035194397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,1,2,power_law_1.01,0.7174911975860596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,2,1,power_law_1.2,0.783897590637207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,1,2,power_law_1.2,0.1344831943511963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,1,2,power_law_1.01,0.9870207786560059
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,2,1,power_law_1.2,0.8805503845214844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,1,2,power_law_1.2,0.1461632013320923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,1,2,power_law_1.01,1.2919487953186035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,2,1,power_law_1.2,0.9411968231201172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,1,2,power_law_1.2,0.1336575984954834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,1,2,power_law_1.01,0.06480000019073487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,1,2,power_law_1.01,1.9772159576416015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,2,1,power_law_1.2,1.089247989654541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,1,2,power_law_1.2,0.14202879667282103
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,1,2,power_law_1.01,0.06071680188179016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,1,2,power_law_1.2,0.163756799697876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,1,2,power_law_1.01,2.6266496658325194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,1,2,power_law_1.01,0.06972159743309021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,2,1,power_law_1.2,1.1363648414611816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,1,2,power_law_1.01,0.09123200178146362
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,1,2,power_law_1.2,0.2198784112930298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,2,1,power_law_1.2,1.3628671646118165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,1,2,power_law_1.01,3.004083251953125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,1,2,power_law_1.01,0.10823040008544922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,1,2,power_law_1.2,0.24897279739379882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,2,1,power_law_1.2,1.5682880401611328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,1,2,power_law_1.01,5.093241500854492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,1,2,power_law_1.01,0.15983999967575074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,1,2,power_law_1.2,0.32863359451293944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,2,1,power_law_1.2,2.004313659667969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,1,2,power_law_1.01,0.15861120223999023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,1,2,power_law_1.2,0.4087039947509766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,1,2,power_law_1.01,9.811628723144532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,2,1,power_law_1.2,2.4255807876586912
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,1,2,power_law_1.01,0.17047040462493895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,1,2,power_law_1.2,0.5403903961181641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,1,2,power_law_1.01,0.16680320501327514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,1,2,power_law_1.2,0.7122111797332764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,2,1,power_law_1.2,3.2652542114257814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,1,2,power_law_1.01,0.1717120051383972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,1,2,power_law_1.2,1.1228416442871094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,2,1,power_law_1.2,4.082003021240235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,1,2,power_law_1.01,0.1774335980415344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,1,2,power_law_1.2,1.3309184074401856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,1,2,power_law_1.01,0.1844159960746765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,2,1,power_law_1.2,4.949939346313476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,1,2,power_law_1.2,2.091948890686035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,1,2,power_law_1.01,0.1840127944946289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,1,2,power_law_1.2,2.652895927429199
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,2,1,power_law_1.2,7.54803237915039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,1,2,power_law_1.01,0.19403519630432128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,1,2,power_law_1.2,0.06232960224151611
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,1,2,power_law_1.2,3.4262462615966798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,1,2,power_law_1.01,0.20405120849609376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,1,2,power_law_1.2,0.062745600938797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,2,1,power_law_1.2,14.839532470703125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,1,2,power_law_1.01,0.2085632085800171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,1,2,power_law_1.2,5.489580917358398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,1,2,power_law_1.2,0.07338879704475403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,1,2,power_law_1.01,0.2302720069885254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,1,2,power_law_1.2,0.08405759930610657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,1,2,power_law_1.01,0.2687936067581177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,1,2,power_law_1.2,10.406829071044921
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,1,2,power_law_1.2,0.09960960149765015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,1,2,power_law_1.01,0.2667455911636353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,1,2,power_law_1.2,0.15921920537948608
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,1,2,power_law_1.01,0.32099840641021726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,2,1,power_law_1.01,0.02184319943189621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,1,2,power_law_1.2,0.17108479738235474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,1,2,power_law_1.01,0.38305280208587644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,2,1,power_law_1.01,0.02655999958515167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,1,2,power_law_1.2,0.17027839422225952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,1,2,power_law_1.01,0.48874878883361816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,2,1,power_law_1.01,0.04028159976005554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,2,1,power_law_1.2,0.023078399896621703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,1,2,power_law_1.2,0.17374720573425292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,1,2,power_law_1.01,0.5751552104949951
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,2,1,power_law_1.01,0.06199679970741272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,2,1,power_law_1.2,0.026348799467086792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,1,2,power_law_1.2,0.17129600048065186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,1,2,power_law_1.01,0.7625472068786621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,2,1,power_law_1.01,0.09619200229644775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,2,1,power_law_1.2,0.04170880019664765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,1,2,power_law_1.2,0.17969919443130494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,2,1,power_law_1.01,0.13468799591064454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,1,2,power_law_1.01,0.9669504165649414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,2,1,power_law_1.2,0.0630079984664917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,2,1,power_law_1.01,0.11176320314407348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,1,2,power_law_1.2,0.18152960538864135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,1,2,power_law_1.01,1.3488832473754884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,2,1,power_law_1.2,0.09086719751358033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,2,1,power_law_1.01,0.11790080070495605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,1,2,power_law_1.2,0.1876736044883728
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,1,2,power_law_1.01,1.678828811645508
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,2,1,power_law_1.2,0.13898240327835082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,2,1,power_law_1.01,0.12321280241012574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,1,2,power_law_1.2,0.1987328052520752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,2,1,power_law_1.2,0.11297279596328735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,1,2,power_law_1.01,2.1730112075805663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,2,1,power_law_1.01,0.13224320411682128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,1,2,power_law_1.2,0.20897281169891357
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,2,1,power_law_1.2,0.11830400228500366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,1,2,power_law_1.01,3.13187198638916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,2,1,power_law_1.01,0.12363519668579101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,1,2,power_law_1.2,0.21305599212646484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,2,1,power_law_1.2,0.12526079416275024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,2,1,power_law_1.01,0.13508479595184325
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,1,2,power_law_1.2,0.2278208017349243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,2,1,power_law_1.2,0.13509119749069215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,1,2,power_law_1.01,6.131391906738282
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,2,1,power_law_1.01,0.14164479970932006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,1,2,power_law_1.2,0.26344320774078367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,2,1,power_law_1.2,0.12833280563354493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,2,1,power_law_1.01,0.13201919794082642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,1,2,power_law_1.2,0.27061119079589846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,2,1,power_law_1.2,0.1363263964653015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,2,1,power_law_1.01,0.15022079944610595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,1,2,power_law_1.2,0.3277631998062134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,2,1,power_law_1.2,0.14450559616088868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,2,1,power_law_1.01,0.1615231990814209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,1,2,power_law_1.2,0.40865278244018555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,2,1,power_law_1.2,0.13345279693603515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,2,1,power_law_1.01,0.14163199663162232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,2,1,power_law_1.2,0.15741440057754516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,1,2,power_law_1.2,0.4952832221984863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,2,1,power_law_1.01,0.18814079761505126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,2,1,power_law_1.2,0.1613055944442749
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,1,2,power_law_1.2,0.6275839805603027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,2,1,power_law_1.01,0.2137279987335205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,2,1,power_law_1.2,0.14903039932250978
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,1,2,power_law_1.2,0.8510272026062011
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,2,1,power_law_1.01,0.2655616044998169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,2,1,power_law_1.2,0.18588160276412963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,2,1,power_law_1.01,0.32064640522003174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,1,2,power_law_1.2,1.003385639190674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,2,1,power_law_1.01,0.05987840294837952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,2,1,power_law_1.2,0.21478400230407715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,2,1,power_law_1.01,0.4281792163848877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,1,2,power_law_1.2,1.344377613067627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,2,1,power_law_1.01,0.06604160070419311
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,2,1,power_law_1.2,0.26986238956451414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,2,1,power_law_1.01,0.5440896034240723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,1,2,power_law_1.2,1.779167938232422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,2,1,power_law_1.01,0.09102079868316651
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,2,1,power_law_1.2,0.3210495948791504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,2,1,power_law_1.01,0.772435188293457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,2,1,power_law_1.01,0.11066880226135253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,2,1,power_law_1.2,0.4342912197113037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,1,2,power_law_1.2,2.247551918029785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,2,1,power_law_1.01,0.9932160377502441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,2,1,power_law_1.01,0.13524479866027833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,2,1,power_law_1.2,0.5514495849609375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,1,2,power_law_1.2,3.1951616287231444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,2,1,power_law_1.01,1.4513407707214356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,2,1,power_law_1.01,0.19504640102386475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,2,1,power_law_1.2,0.7769408226013184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,2,1,power_law_1.01,0.20980479717254638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,2,1,power_law_1.01,1.904755210876465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,2,1,power_law_1.2,1.0030271530151367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,1,2,power_law_1.2,6.508403015136719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,2,1,power_law_1.01,0.21697919368743895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,2,1,power_law_1.01,2.3592191696166993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,2,1,power_law_1.2,1.4472448348999023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,2,1,power_law_1.01,0.2185983896255493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,2,1,power_law_1.01,3.7041473388671875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,2,1,power_law_1.2,1.9035327911376954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,2,1,power_law_1.01,0.22187519073486328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,2,1,power_law_1.01,0.22946560382843018
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,2,1,power_law_1.2,2.3563520431518556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,2,1,power_law_1.01,7.36657943725586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,2,1,power_law_1.01,0.23313920497894286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,2,1,power_law_1.2,3.7225662231445313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,2,1,power_law_1.01,0.23991680145263672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,2,1,power_law_1.01,0.25691521167755127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,2,1,power_law_1.2,7.355110168457031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,2,1,power_law_1.01,0.2654400110244751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,2,1,power_law_1.01,0.2652992010116577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,2,1,power_law_1.2,0.059059202671051025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,2,1,power_law_1.01,0.2978559970855713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,2,1,power_law_1.2,0.06602879762649536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,2,1,power_law_1.01,0.3549760103225708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,2,1,power_law_1.2,0.08179839849472045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,1,2,power_law_1.01,0.044172799587249754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,2,1,power_law_1.01,0.35376639366149903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,2,1,power_law_1.2,0.10206079483032227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,1,2,power_law_1.01,0.04457600116729736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,2,1,power_law_1.01,0.43916797637939453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,2,1,power_law_1.2,0.12501120567321777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,1,2,power_law_1.01,0.052774399518966675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,2,1,power_law_1.01,0.49692158699035643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,2,1,power_law_1.2,0.20283520221710205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,1,2,power_law_1.01,0.07160959839820862
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,2,1,power_law_1.01,0.648799991607666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,2,1,power_law_1.2,0.21266560554504393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,1,2,power_law_1.2,0.055225598812103274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,1,2,power_law_1.01,0.09864959716796876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,2,1,power_law_1.01,0.7785280227661133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,2,1,power_law_1.2,0.220032000541687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,1,2,power_law_1.2,0.047865599393844604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,1,2,power_law_1.01,0.11155840158462524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,2,1,power_law_1.01,1.0484543800354005
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,2,1,power_law_1.2,0.22352640628814696
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,1,2,power_law_1.2,0.08511999845504761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,1,2,power_law_1.01,0.13428479433059692
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,2,1,power_law_1.01,1.2972864151000976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,2,1,power_law_1.2,0.22699520587921143
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,1,2,power_law_1.2,0.1142016053199768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,1,2,power_law_1.01,0.1588544011116028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,2,1,power_law_1.01,1.8328319549560548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,2,1,power_law_1.2,0.23129599094390868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,1,2,power_law_1.2,0.1512768030166626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,1,2,power_law_1.01,0.17401599884033203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,2,1,power_law_1.01,2.3538496017456056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,2,1,power_law_1.2,0.23598721027374267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,1,2,power_law_1.01,0.19263999462127684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,1,2,power_law_1.2,0.23566079139709473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,2,1,power_law_1.01,2.8787456512451173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,1,2,power_law_1.01,0.23811841011047363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,2,1,power_law_1.2,0.2435904026031494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,1,2,power_law_1.2,0.2594111919403076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,2,1,power_law_1.01,4.402048110961914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,1,2,power_law_1.01,0.26371839046478274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,2,1,power_law_1.2,0.25443201065063475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,1,2,power_law_1.2,0.29279360771179197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,1,2,power_law_1.01,0.1996224045753479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,2,1,power_law_1.2,0.26796159744262693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,1,2,power_law_1.2,0.2862528085708618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,2,1,power_law_1.01,8.804838562011719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,1,2,power_law_1.01,0.22868480682373046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,2,1,power_law_1.2,0.2775871992111206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,1,2,power_law_1.2,0.3122495889663696
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,1,2,power_law_1.01,0.2693824052810669
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,1,2,power_law_1.2,0.34987521171569824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,1,2,power_law_1.01,0.21580159664154053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,1,2,power_law_1.2,0.382694411277771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,1,2,power_law_1.01,0.2479423999786377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,1,2,power_law_1.2,0.343174409866333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,1,2,power_law_1.01,0.35628159046173097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,1,2,power_law_1.2,0.3796288013458252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,1,2,power_law_1.01,0.45642881393432616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,1,2,power_law_1.2,0.4273536205291748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,1,2,power_law_1.01,0.601420783996582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,1,2,power_law_1.2,0.36447360515594485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,1,2,power_law_1.01,0.7699840068817139
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,1,2,power_law_1.2,0.41484799385070803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,1,2,power_law_1.2,0.5411712169647217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,1,2,power_law_1.01,1.162502384185791
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,1,2,power_law_1.2,0.6083839893341064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,1,2,power_law_1.01,1.47326717376709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,1,2,power_law_1.2,0.8252799987792969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,1,2,power_law_1.01,2.184127998352051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,1,2,power_law_1.01,0.10823040008544922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,1,2,power_law_1.2,0.9952447891235352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,1,2,power_law_1.01,2.907481575012207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,1,2,power_law_1.01,0.13608959913253785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,1,2,power_law_1.2,1.3644991874694825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,1,2,power_law_1.01,4.262630462646484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,1,2,power_law_1.01,0.1285055994987488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,1,2,power_law_1.2,1.7329343795776366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,1,2,power_law_1.01,5.5993598937988285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,1,2,power_law_1.01,0.1737663984298706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,1,2,power_law_1.2,2.572211265563965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,1,2,power_law_1.01,0.2230976104736328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,1,2,power_law_1.01,6.956781005859375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,1,2,power_law_1.2,3.0827903747558594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,1,2,power_law_1.01,0.32674560546875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,1,2,power_law_1.01,11.305919647216797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,1,2,power_law_1.2,4.634745788574219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,1,2,power_law_1.01,0.35207040309906007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,1,2,power_law_1.01,0.35726079940795896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,1,2,power_law_1.2,6.1887870788574215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,1,2,power_law_1.01,0.37918078899383545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,1,2,power_law_1.01,22.99630126953125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,1,2,power_law_1.2,8.277529907226562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,1,2,power_law_1.01,0.3828671932220459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,1,2,power_law_1.01,0.39492480754852294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,1,2,power_law_1.2,12.775750732421875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,1,2,power_law_1.01,0.39842560291290285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,1,2,power_law_1.01,0.4076352119445801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,1,2,power_law_1.01,0.42218880653381347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,1,2,power_law_1.2,23.355718994140624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,1,2,power_law_1.01,0.4407872200012207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,1,2,power_law_1.01,0.44778242111206057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,1,2,power_law_1.01,0.4747456073760986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,1,2,power_law_1.01,0.5403584003448486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,1,2,power_law_1.01,0.5772223949432373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,2,1,power_law_1.01,0.03473919928073883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,1,2,power_law_1.01,0.6777728080749512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,2,1,power_law_1.01,0.04867199957370758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,2,1,power_law_1.01,0.05480960011482239
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,1,2,power_law_1.01,0.718726396560669
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,1,2,power_law_1.2,0.10684159994125367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,2,1,power_law_1.01,0.09208959937095643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,1,2,power_law_1.01,0.8911680221557617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,1,2,power_law_1.2,0.09701120257377624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,2,1,power_law_1.01,0.1404096007347107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,1,2,power_law_1.01,1.07193603515625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,1,2,power_law_1.2,0.12363519668579101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,2,1,power_law_1.01,0.21539199352264404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,1,2,power_law_1.2,0.15845760107040405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,1,2,power_law_1.01,1.4119744300842285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,2,1,power_law_1.01,0.2553215980529785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,1,2,power_law_1.2,0.20535039901733398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,1,2,power_law_1.01,1.7230592727661134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,2,1,power_law_1.01,0.2399616003036499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,1,2,power_law_1.2,0.32023680210113525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,1,2,power_law_1.01,2.2799104690551757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,2,1,power_law_1.01,0.25961599349975584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,1,2,power_law_1.2,0.357094407081604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,1,2,power_law_1.01,2.8865472793579103
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,2,1,power_law_1.01,0.27312641143798827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,1,2,power_law_1.2,0.36693758964538575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,2,1,power_law_1.01,0.29729280471801756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,1,2,power_law_1.2,0.37983360290527346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,1,2,power_law_1.01,3.3794815063476564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,2,1,power_law_1.01,0.31490559577941896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,1,2,power_law_1.2,0.3835263967514038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,1,2,power_law_1.01,5.441606521606445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,2,1,power_law_1.01,0.2843839883804321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,1,2,power_law_1.2,0.40380158424377444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,2,1,power_law_1.01,0.3122495889663696
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,1,2,power_law_1.2,0.4087615966796875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,1,2,power_law_1.01,10.56899185180664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,1,2,power_law_1.2,0.41157121658325196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,2,1,power_law_1.01,0.3439872026443481
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,1,2,power_law_1.2,0.42755842208862305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,1,2,power_law_1.2,0.44332160949707033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,1,2,power_law_1.2,0.4662464141845703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,1,2,power_law_1.2,0.49205760955810546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,2,1,power_law_1.2,0.035718399286270144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,1,2,power_law_1.2,0.5526847839355469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,2,1,power_law_1.2,0.03901439905166626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,1,2,power_law_1.2,0.6043007850646973
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,2,1,power_law_1.2,0.05006719827651977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,1,2,power_law_1.2,0.6954304218292237
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,2,1,power_law_1.2,0.08856959939002991
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,1,2,power_law_1.2,0.7679232120513916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,2,1,power_law_1.2,0.13566720485687256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,1,2,power_law_1.2,0.9514368057250977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,2,1,power_law_1.2,0.2042623996734619
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,2,1,power_law_1.2,0.2560960054397583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,1,2,power_law_1.2,1.086400032043457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,2,1,power_law_1.2,0.23335680961608887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,1,2,power_law_1.2,1.42225923538208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,2,1,power_law_1.2,0.2618304014205933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,1,2,power_law_1.2,1.7104127883911133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,2,1,power_law_1.2,0.2816960096359253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,1,2,power_law_1.2,2.4894784927368163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,2,1,power_law_1.2,0.30360960960388184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,1,2,power_law_1.2,3.009062385559082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,2,1,power_law_1.2,0.322380805015564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,2,1,power_law_1.2,0.29614720344543455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,1,2,power_law_1.2,4.133196640014648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,2,1,power_law_1.2,0.3308480024337769
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,1,2,power_law_1.2,5.884255981445312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,2,1,power_law_1.2,0.34416000843048095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,2,1,power_law_1.2,0.3154815912246704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,1,2,power_law_1.2,12.520166778564453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,2,1,power_law_1.2,0.35399041175842283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,2,1,power_law_1.2,0.4371391773223877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,2,1,power_law_1.2,0.5051263809204102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,2,1,power_law_1.2,0.6218624114990234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,2,1,power_law_1.2,0.7588736057281494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,2,1,power_law_1.2,1.003001594543457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,2,1,power_law_1.2,1.250924777984619
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,2,1,power_law_1.2,1.7590463638305665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,2,1,power_law_1.2,2.2593727111816406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,2,1,power_law_1.2,3.267193603515625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,2,1,power_law_1.2,4.261772918701172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,2,1,power_law_1.2,5.2888446807861325
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,2,1,power_law_1.2,8.32745590209961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,2,1,power_law_1.01,0.09230080246925354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,2,1,power_law_1.01,0.11299200057983398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,2,1,power_law_1.2,16.500819396972656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,2,1,power_law_1.01,0.13654400110244752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,2,1,power_law_1.01,0.19941760301589967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,2,1,power_law_1.01,0.24036478996276855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,2,1,power_law_1.01,0.3738431930541992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,2,1,power_law_1.01,0.40094718933105467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,2,1,power_law_1.01,0.4228479862213135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,2,1,power_law_1.01,0.4269375801086426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,2,1,power_law_1.01,0.4363711833953857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,2,1,power_law_1.01,0.45844478607177735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,2,1,power_law_1.01,0.4601151943206787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,2,1,power_law_1.01,0.4625984191894531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,2,1,power_law_1.01,0.4863423824310303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,2,1,power_law_1.01,0.5043647766113282
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,2,1,power_law_1.01,0.5055935859680176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,2,1,power_law_1.01,0.5572031974792481
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,2,1,power_law_1.01,0.6479167938232422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,2,1,power_law_1.2,0.09306880235671997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,2,1,power_law_1.01,0.7077311992645263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,2,1,power_law_1.2,0.10208640098571778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,2,1,power_law_1.2,0.13198720216751098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,2,1,power_law_1.01,0.8479999542236328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,2,1,power_law_1.2,0.17745280265808105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,2,1,power_law_1.01,0.8695039749145508
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,2,1,power_law_1.2,0.22537600994110107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,2,1,power_law_1.01,1.097862434387207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,2,1,power_law_1.2,0.37221760749816896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,2,1,power_law_1.01,1.309222412109375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,2,1,power_law_1.2,0.4037504196166992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,2,1,power_law_1.01,1.7214847564697267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,2,1,power_law_1.2,0.4184959888458252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,2,1,power_law_1.01,2.088262367248535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,2,1,power_law_1.2,0.44572157859802247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,2,1,power_law_1.01,2.8829055786132813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,2,1,power_law_1.2,0.45162239074707033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,2,1,power_law_1.01,3.733235168457031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,2,1,power_law_1.2,0.46744961738586427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,2,1,power_law_1.2,0.48300800323486326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,2,1,power_law_1.01,4.451667022705078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,2,1,power_law_1.2,0.48424320220947265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,2,1,power_law_1.01,6.769395446777343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,2,1,power_law_1.2,0.5010367870330811
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,2,1,power_law_1.2,0.5273983955383301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,2,1,power_law_1.01,13.723788452148437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,2,1,power_law_1.2,0.5382912158966064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,2,1,power_law_1.2,0.5825471878051758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,2,1,power_law_1.2,0.6564735889434814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,2,1,power_law_1.2,0.7175039768218994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,2,1,power_law_1.2,0.8555392265319824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,2,1,power_law_1.2,0.8784832000732422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,2,1,power_law_1.2,1.0916735649108886
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,2,1,power_law_1.2,1.3296575546264648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,2,1,power_law_1.2,1.7254592895507812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,2,1,power_law_1.2,2.089798355102539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,2,1,power_law_1.2,0.30811519622802735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,2,1,power_law_1.2,2.859084892272949
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,2,1,power_law_1.2,0.35704960823059084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,2,1,power_law_1.2,0.3769151926040649
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,2,1,power_law_1.2,3.6856704711914063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,2,1,power_law_1.2,0.4506432056427002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,2,1,power_law_1.2,4.483558273315429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,2,1,power_law_1.2,0.5002111911773681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,1,2,power_law_1.01,0.11564160585403442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,2,1,power_law_1.2,6.9600067138671875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,2,1,power_law_1.2,0.6376319885253906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,1,2,power_law_1.01,0.15783040523529052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,2,1,power_law_1.2,0.7728000164031983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,1,2,power_law_1.01,0.21539199352264404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,2,1,power_law_1.2,13.812991333007812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,2,1,power_law_1.2,1.0320768356323242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,1,2,power_law_1.01,0.18035839796066283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,2,1,power_law_1.2,1.2927231788635254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,1,2,power_law_1.01,0.2960832118988037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,2,1,power_law_1.2,1.8148223876953125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,1,2,power_law_1.01,0.3802367925643921
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,2,1,power_law_1.2,2.3280511856079102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,1,2,power_law_1.01,0.4490496158599854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,2,1,power_law_1.2,2.846393585205078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,1,2,power_law_1.01,0.5649856090545654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,2,1,power_law_1.2,4.444659042358398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,1,2,power_law_1.01,0.5923967838287354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,2,1,power_law_1.2,8.87488021850586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,1,2,power_law_1.01,0.5886655807495117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,1,2,power_law_1.01,0.6352191925048828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,1,2,power_law_1.01,0.6737343788146972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,1,2,power_law_1.01,0.6987135887145997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,1,2,power_law_1.01,0.7126272201538086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,1,2,power_law_1.2,0.11785600185394288
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,1,2,power_law_1.01,0.7441792011260986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,1,2,power_law_1.2,0.15239039659500123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,1,2,power_law_1.01,0.7323008060455323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,1,2,power_law_1.2,0.15406080484390258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,1,2,power_law_1.01,0.7478591918945312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,1,2,power_law_1.2,0.18606079816818238
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,1,2,power_law_1.01,0.8179007530212402
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,1,2,power_law_1.2,0.2618304014205933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,1,2,power_law_1.01,0.903923225402832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,1,2,power_law_1.2,0.3590912103652954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,1,2,power_law_1.01,1.0247424125671387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,1,2,power_law_1.2,0.4170688152313232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,1,2,power_law_1.01,1.1433343887329102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,1,2,power_law_1.2,0.5198783874511719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,1,2,power_law_1.01,1.3604160308837892
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,1,2,power_law_1.2,0.5731264114379883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,1,2,power_law_1.01,1.4296319961547852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,1,2,power_law_1.2,0.5927807807922363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,2,1,power_law_1.01,0.115174400806427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,1,2,power_law_1.2,0.6230976104736328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,1,2,power_law_1.01,1.784556770324707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,2,1,power_law_1.01,0.1446720004081726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,1,2,power_law_1.2,0.6646656036376953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,1,2,power_law_1.01,2.161190414428711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,2,1,power_law_1.01,0.19013760089874268
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,1,2,power_law_1.2,0.6769599914550781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,2,1,power_law_1.01,0.2202239990234375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,1,2,power_law_1.01,2.779257583618164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,1,2,power_law_1.2,0.6921152114868164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,2,1,power_law_1.01,0.3498816013336182
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,1,2,power_law_1.01,3.4704769134521483
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,1,2,power_law_1.2,0.7314303874969482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,2,1,power_law_1.01,0.4727680206298828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,1,2,power_law_1.01,4.082003021240235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,1,2,power_law_1.2,0.7670591831207275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,2,1,power_law_1.01,0.5530432224273681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,1,2,power_law_1.2,0.7949120044708252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,1,2,power_law_1.01,5.973132705688476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,2,1,power_law_1.01,0.6990719795227051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,1,2,power_law_1.2,0.860051155090332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,2,1,power_law_1.01,0.734278392791748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,2,1,power_law_1.01,0.3140928030014038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,1,2,power_law_1.01,10.99298553466797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,1,2,power_law_1.2,0.9337727546691894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,2,1,power_law_1.01,0.33641600608825684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,2,1,power_law_1.01,0.7502592086791993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,1,2,power_law_1.2,1.0761024475097656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,2,1,power_law_1.01,0.4293824195861816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,2,1,power_law_1.01,0.8018688201904297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,1,2,power_law_1.2,1.1666239738464355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,2,1,power_law_1.01,0.4904191970825195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,2,1,power_law_1.01,0.8415936470031739
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,2,1,power_law_1.01,0.6149439811706543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,1,2,power_law_1.2,1.3955840110778808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,2,1,power_law_1.01,0.8423999786376953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,2,1,power_law_1.01,0.7351552009582519
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,1,2,power_law_1.2,1.5125311851501464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,2,1,power_law_1.01,0.9813247680664062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,2,1,power_law_1.01,0.8829631805419922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,1,2,power_law_1.2,1.8869056701660156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,2,1,power_law_1.01,1.2526847839355468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,2,1,power_law_1.01,0.8817472457885742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,1,2,power_law_1.2,2.268441581726074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,2,1,power_law_1.01,1.7505407333374023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,2,1,power_law_1.01,0.9223039627075196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,1,2,power_law_1.2,2.9070079803466795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,2,1,power_law_1.01,2.251296043395996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,2,1,power_law_1.01,0.9644736289978028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,2,1,power_law_1.01,3.257459259033203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,1,2,power_law_1.2,3.5783424377441406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,2,1,power_law_1.01,1.071993637084961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,2,1,power_law_1.01,4.2654975891113285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,1,2,power_law_1.2,4.43480339050293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,2,1,power_law_1.01,1.1440832138061523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,2,1,power_law_1.01,5.2346240997314455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,1,2,power_law_1.2,6.304230499267578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,2,1,power_law_1.01,1.321446418762207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,2,1,power_law_1.01,8.303743743896485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,2,1,power_law_1.01,1.4635775566101075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,2,1,power_law_1.2,0.11544320583343506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,1,2,power_law_1.2,12.506195068359375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,2,1,power_law_1.01,1.7320703506469726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,2,1,power_law_1.2,0.14165120124816893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,2,1,power_law_1.01,16.463591003417967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,2,1,power_law_1.2,0.163372802734375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,2,1,power_law_1.01,1.8561088562011718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,2,1,power_law_1.2,0.20554239749908448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,2,1,power_law_1.01,2.2897472381591797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,2,1,power_law_1.2,0.30958080291748047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,2,1,power_law_1.01,2.7624256134033205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,2,1,power_law_1.2,0.42101120948791504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,2,1,power_law_1.01,3.622995376586914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,2,1,power_law_1.2,0.48919677734375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,2,1,power_law_1.01,4.552364730834961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,2,1,power_law_1.2,0.6556992053985595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,2,1,power_law_1.2,0.6757696151733399
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,2,1,power_law_1.01,5.524288177490234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,2,1,power_law_1.2,0.7363840103149414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,2,1,power_law_1.01,8.0617919921875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,2,1,power_law_1.2,0.7887551784515381
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,2,1,power_law_1.2,0.8195520401000976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,2,1,power_law_1.01,15.162783813476562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,2,1,power_law_1.2,0.8467840194702149
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,2,1,power_law_1.2,0.8781248092651367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,2,1,power_law_1.2,0.8887743949890137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,2,1,power_law_1.2,0.9387455940246582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,2,1,power_law_1.2,0.9865920066833496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,2,1,power_law_1.2,1.0937791824340821
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,2,1,power_law_1.2,1.2079808235168457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,2,1,power_law_1.2,1.349766445159912
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,2,1,power_law_1.2,1.4928704261779786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,2,1,power_law_1.2,1.8095104217529296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,2,1,power_law_1.2,1.9096895217895509
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,2,1,power_law_1.2,2.3842111587524415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,2,1,power_law_1.2,2.871443176269531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,2,1,power_law_1.2,3.6991424560546875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,2,1,power_law_1.2,4.654764938354492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,2,1,power_law_1.2,5.562438583374023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,2,1,power_law_1.2,8.22995834350586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,2,1,power_law_1.2,15.771527099609376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,4,power_law_1.01,0.12010879516601562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,4,power_law_1.01,0.14714239835739135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,4,power_law_1.2,0.11052160263061524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,4,power_law_1.01,0.12871040105819703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,4,power_law_1.2,0.12178560495376586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,4,power_law_1.01,0.13893120288848876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,4,power_law_1.2,0.1260800004005432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,4,power_law_1.01,0.13975679874420166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,4,power_law_1.2,0.13672959804534912
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,4,power_law_1.01,0.14488320350646972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,4,power_law_1.2,0.13815679550170898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,4,power_law_1.01,0.16352640390396117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,4,power_law_1.2,0.14533120393753052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,4,power_law_1.01,0.1749824047088623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,4,power_law_1.2,0.15086079835891725
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,4,power_law_1.01,0.18564480543136597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,4,power_law_1.2,0.18056319952011107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,4,power_law_1.01,0.21390719413757325
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,4,power_law_1.2,0.18343679904937743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,4,power_law_1.01,0.16516480445861817
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,4,power_law_1.2,0.21476480960845948
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,4,power_law_1.01,0.17967360019683837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,4,power_law_1.2,0.1686784029006958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,4,power_law_1.01,0.18462079763412476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,2,power_law_1.01,0.07953919768333435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,4,power_law_1.2,0.18014719486236572
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,4,power_law_1.01,0.21656959056854247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,4,power_law_1.2,0.17934080362319946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,2,power_law_1.01,0.0820032000541687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,4,power_law_1.01,0.241759991645813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,2,power_law_1.01,0.09838079810142517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,4,power_law_1.2,0.21763839721679687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,4,power_law_1.01,0.25731201171875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,4,power_law_1.2,0.2241919994354248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,2,power_law_1.01,0.1372928023338318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,4,power_law_1.01,0.2872191905975342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,4,power_law_1.2,0.28173439502716063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,2,power_law_1.01,0.1375040054321289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,4,power_law_1.01,0.3187455892562866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,4,power_law_1.2,0.2655616044998169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,2,power_law_1.01,0.1411967992782593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,4,power_law_1.01,0.4006783962249756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,4,power_law_1.2,0.3538304090499878
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,2,power_law_1.01,0.14958720207214354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,4,power_law_1.01,0.527238416671753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,4,power_law_1.2,0.45971198081970216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,2,power_law_1.01,0.16043519973754883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,4,power_law_1.01,0.7821887969970703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,4,power_law_1.2,0.5354688167572021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,2,power_law_1.01,0.16513919830322266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,4,power_law_1.01,0.8866559982299804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,4,power_law_1.2,0.9452799797058106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,2,power_law_1.01,0.16597119569778443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,4,power_law_1.01,1.2141183853149413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,2,power_law_1.01,0.15266560316085814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,4,power_law_1.2,1.23056001663208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,4,power_law_1.01,2.061580848693848
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,2,power_law_1.01,0.15879039764404296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,4,power_law_1.2,1.6923904418945312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,4,power_law_1.01,2.423500823974609
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,2,power_law_1.01,0.16391680240631104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,4,power_law_1.2,2.3211200714111326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,2,power_law_1.01,0.17678719758987427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,4,power_law_1.01,4.2519489288330075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,4,power_law_1.2,3.6246784210205076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,2,power_law_1.01,0.1856384038925171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,4,power_law_1.01,5.921644973754883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,4,power_law_1.2,5.7863422393798825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,2,power_law_1.01,0.19055999517440797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,4,power_law_1.01,7.605741119384765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,4,power_law_1.2,6.820595550537109
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,2,power_law_1.01,0.23375999927520752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,2,power_law_1.01,0.25547521114349364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,4,power_law_1.2,9.089778900146484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,4,power_law_1.01,14.287571716308594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,2,power_law_1.01,0.32058238983154297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,2,power_law_1.01,0.415008020401001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,4,power_law_1.2,13.623245239257812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,2,power_law_1.01,0.5177663803100586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,4,power_law_1.01,34.27191162109375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,2,power_law_1.01,0.6540160179138184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,2,power_law_1.01,1.0119999885559081
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,4,power_law_1.2,40.848504638671876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,2,power_law_1.01,1.4615360260009767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,2,power_law_1.01,1.5973055839538575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,2,power_law_1.2,0.07570559978485107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,2,power_law_1.01,2.947756767272949
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,2,power_law_1.2,0.07879040241241456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,2,power_law_1.01,3.7004032135009766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,2,power_law_1.2,0.11523840427398682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,2,power_law_1.01,5.096518325805664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,2,power_law_1.2,0.13898880481719972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,2,power_law_1.2,0.14125440120697022
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,2,power_law_1.01,8.0229248046875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,2,power_law_1.2,0.14370559453964232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,2,power_law_1.2,0.15701119899749755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,2,power_law_1.01,17.586079406738282
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,2,power_law_1.2,0.14944000244140626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,2,power_law_1.2,0.1551743984222412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,2,power_law_1.2,0.15353599786758423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,2,power_law_1.2,0.17004159688949586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,2,power_law_1.2,0.17237119674682616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,2,power_law_1.2,0.1674623966217041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,2,power_law_1.2,0.17728639841079713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,2,power_law_1.2,0.18794239759445192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,2,power_law_1.2,0.19531519412994386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,2,power_law_1.2,0.2389375925064087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,2,power_law_1.2,0.27272961139678953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,2,power_law_1.2,0.2930176019668579
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,2,power_law_1.2,0.42858238220214845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,2,power_law_1.2,0.5379392147064209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,2,power_law_1.2,0.7687551975250244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,2,power_law_1.2,0.8445311546325683
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,2,power_law_1.2,1.3759872436523437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,2,power_law_1.2,2.006771278381348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,2,power_law_1.2,3.277548980712891
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,2,power_law_1.2,4.240838241577149
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,2,power_law_1.2,4.651935958862305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,2,power_law_1.2,8.434214019775391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,2,power_law_1.2,19.69496307373047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,1,power_law_1.01,0.06275839805603027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,1,power_law_1.01,0.07074559926986694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,1,power_law_1.01,0.07340160012245178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,1,power_law_1.2,0.0605567991733551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,1,power_law_1.01,0.1315775990486145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,1,power_law_1.2,0.07241600155830383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,1,power_law_1.01,0.1340288043022156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,1,power_law_1.2,0.07201279997825623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,1,power_law_1.01,0.13648639917373656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,1,power_law_1.2,0.1369472026824951
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,1,power_law_1.01,0.14056320190429689
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,1,power_law_1.2,0.13326079845428468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,1,power_law_1.01,0.14324480295181274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,1,power_law_1.2,0.14042240381240845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,1,power_law_1.01,0.14632320404052734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,1,power_law_1.2,0.14370559453964232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,1,power_law_1.01,0.1565567970275879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,1,power_law_1.2,0.1504639983177185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,1,power_law_1.01,0.1536960005760193
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,1,power_law_1.2,0.1580288052558899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,1,power_law_1.01,0.1590208053588867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,1,power_law_1.2,0.15802240371704102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,1,power_law_1.01,0.16106239557266236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,1,power_law_1.2,0.1473855972290039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,1,power_law_1.01,0.16290559768676757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,1,power_law_1.2,0.15148799419403075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,1,power_law_1.01,0.17499519586563111
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,1,power_law_1.2,0.1537343978881836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,1,power_law_1.01,0.18503040075302124
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,1,power_law_1.2,0.16110719442367555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,1,power_law_1.01,0.19342080354690552
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,1,power_law_1.2,0.1754431962966919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,1,power_law_1.01,0.22435200214385986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,1,power_law_1.2,0.18157440423965454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,1,power_law_1.01,0.26428799629211425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,1,power_law_1.2,0.19162240028381347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,1,power_law_1.01,0.33044478893280027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,1,power_law_1.2,0.22439680099487305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,1,power_law_1.01,0.39842560291290285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,1,power_law_1.2,0.25920639038085935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,1,power_law_1.01,0.5305280208587646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,1,power_law_1.2,0.32330238819122314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,1,power_law_1.01,0.6540224075317382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,1,power_law_1.2,0.4023615837097168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,1,power_law_1.01,0.9399104118347168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,1,power_law_1.2,0.5363071918487549
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,1,power_law_1.01,1.2305343627929688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,1,power_law_1.2,0.6618495941162109
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,1,power_law_1.01,1.8582208633422852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,1,power_law_1.2,0.9526464462280273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,1,power_law_1.01,2.467321586608887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,1,power_law_1.2,1.2133567810058594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,1,power_law_1.01,3.1505279541015625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,1,power_law_1.2,1.8263296127319335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,1,power_law_1.2,2.5095487594604493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,1,power_law_1.01,5.138604736328125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,1,power_law_1.2,3.2030078887939455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,1,power_law_1.01,10.770719909667969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,1,power_law_1.2,5.1059326171875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,1,power_law_1.2,10.792902374267578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,4,power_law_1.01,0.21573119163513182
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,4,power_law_1.01,0.21266560554504393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,4,power_law_1.01,0.24359679222106934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,4,power_law_1.01,0.22249600887298585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,4,power_law_1.01,0.22207999229431152
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,4,power_law_1.01,0.23253118991851807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,4,power_law_1.01,0.2556735992431641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,4,power_law_1.01,0.3064703941345215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,4,power_law_1.01,0.30891520977020265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,4,power_law_1.01,0.3330944061279297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,4,power_law_1.01,0.24973440170288086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,4,power_law_1.01,0.2819008111953735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,4,power_law_1.01,0.28557438850402833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,4,power_law_1.01,0.32039039134979247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,4,power_law_1.01,0.33882238864898684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,4,power_law_1.01,0.40395522117614746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,4,power_law_1.01,0.39103360176086427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,4,power_law_1.01,0.5182335853576661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,4,power_law_1.01,0.5468992233276367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,4,power_law_1.01,0.9222975730895996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,4,power_law_1.01,0.953433609008789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,4,power_law_1.01,1.8969472885131835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,4,power_law_1.01,2.3432064056396484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,4,power_law_1.01,3.1718208312988283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,4,power_law_1.01,4.462604904174805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,4,power_law_1.01,7.24466552734375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,4,power_law_1.2,0.2133375883102417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,4,power_law_1.2,0.23054080009460448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,4,power_law_1.01,8.823296356201173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,4,power_law_1.2,0.1850816011428833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,4,power_law_1.01,14.718258666992188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,4,power_law_1.2,0.22519679069519044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,4,power_law_1.2,0.21742720603942872
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,4,power_law_1.2,0.22685439586639405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,4,power_law_1.01,25.039161682128906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,4,power_law_1.2,0.23300480842590332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,4,power_law_1.2,0.29258880615234373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,4,power_law_1.2,0.30407679080963135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,4,power_law_1.2,0.3526079893112183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,4,power_law_1.01,49.010763549804686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,4,power_law_1.2,0.2428287982940674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,4,power_law_1.2,0.2819391965866089
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,4,power_law_1.2,0.2868607997894287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,4,power_law_1.2,0.2905407905578613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,4,power_law_1.2,0.3835263967514038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,4,power_law_1.2,0.41445121765136717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,4,power_law_1.2,0.43267202377319336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,4,power_law_1.2,0.5494080066680909
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,4,power_law_1.2,0.7114175796508789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,4,power_law_1.2,1.159641647338867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,4,power_law_1.2,1.2853952407836915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,4,power_law_1.2,1.7403200149536133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,4,power_law_1.2,2.5701696395874025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,4,power_law_1.2,3.6947265625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,4,power_law_1.2,5.9581951141357425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,4,power_law_1.2,9.262649536132812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,4,power_law_1.2,13.204460144042969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,4,power_law_1.2,17.053024291992188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,4,power_law_1.2,24.533978271484376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,4,power_law_1.2,66.5813720703125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,2,power_law_1.01,0.13177599906921386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,2,power_law_1.01,0.12830079793930055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,2,power_law_1.01,0.15492479801177977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,2,power_law_1.01,0.22169599533081055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,2,power_law_1.2,0.12362240552902222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,2,power_law_1.01,0.21882240772247313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,2,power_law_1.2,0.13797119855880738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,2,power_law_1.01,0.22045440673828126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,2,power_law_1.2,0.15374079942703248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,2,power_law_1.01,0.23028481006622314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,2,power_law_1.2,0.21661438941955566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,2,power_law_1.01,0.22454400062561036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,2,power_law_1.01,0.2329472064971924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,2,power_law_1.2,0.21578879356384278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,2,power_law_1.01,0.22885119915008545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,2,power_law_1.2,0.2200767993927002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,2,power_law_1.01,0.2339711904525757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,2,power_law_1.2,0.24813439846038818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,2,power_law_1.01,0.24749441146850587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,2,power_law_1.2,0.22458879947662352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,2,power_law_1.01,0.25077118873596194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,2,power_law_1.2,0.2254080057144165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,2,power_law_1.01,0.26202878952026365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,2,power_law_1.2,0.23708798885345458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,2,power_law_1.01,0.27779839038848875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,2,power_law_1.2,0.2403712034225464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,2,power_law_1.01,0.3056576013565063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,2,power_law_1.2,0.2729023933410645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,2,power_law_1.01,0.31077120304107664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,2,power_law_1.2,0.2706815958023071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,2,power_law_1.01,0.4094848155975342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,2,power_law_1.2,0.2651456117630005
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,2,power_law_1.01,0.47646079063415525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,2,power_law_1.2,0.29176959991455076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,2,power_law_1.01,0.7277247905731201
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,2,power_law_1.2,0.3220799922943115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,2,power_law_1.01,0.7588799953460693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,2,power_law_1.2,0.3487103939056396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,2,power_law_1.01,1.0818495750427246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,2,power_law_1.2,0.4343103885650635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,2,power_law_1.01,1.488377571105957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,2,power_law_1.2,0.47560958862304686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,2,power_law_1.01,2.0861888885498048
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,2,power_law_1.2,0.669209623336792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,2,power_law_1.2,0.8723711967468262
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,2,power_law_1.01,2.8128000259399415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,2,power_law_1.2,1.318227195739746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,2,power_law_1.01,4.324857711791992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,2,power_law_1.2,1.4953599929809571
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,2,power_law_1.01,7.59222412109375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,2,power_law_1.2,1.8869504928588867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,2,power_law_1.01,9.240876770019531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,2,power_law_1.2,2.8284160614013674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,2,power_law_1.2,4.550387191772461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,2,power_law_1.01,14.06324462890625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,2,power_law_1.2,6.293632125854492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,2,power_law_1.01,31.969158935546876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,2,power_law_1.2,9.463942718505859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,2,power_law_1.2,17.532806396484375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,2,power_law_1.2,37.6641357421875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,1,power_law_1.01,0.08507519960403442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,1,power_law_1.01,0.09838719964027405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,1,power_law_1.01,0.14222079515457153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,1,power_law_1.01,0.21021440029144287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,1,power_law_1.01,0.21267199516296387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,1,power_law_1.01,0.21307520866394042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,1,power_law_1.01,0.22311038970947267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,1,power_law_1.01,0.2128000020980835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,1,power_law_1.01,0.2192255973815918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,1,power_law_1.01,0.21390080451965332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,1,power_law_1.01,0.22885119915008545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,1,power_law_1.01,0.2349951982498169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,1,power_law_1.01,0.24379520416259765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,1,power_law_1.01,0.2446079969406128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,1,power_law_1.01,0.26489601135253904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,1,power_law_1.01,0.27594239711761476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,1,power_law_1.01,0.29191040992736816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,1,power_law_1.01,0.3416703939437866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,1,power_law_1.01,0.396780800819397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,1,power_law_1.01,0.50348801612854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,1,power_law_1.01,0.6099775791168213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,1,power_law_1.01,0.8207167625427246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,1,power_law_1.01,1.0431360244750976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,1,power_law_1.01,1.5301376342773438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,1,power_law_1.01,1.9202880859375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,1,power_law_1.01,2.9299583435058594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,1,power_law_1.01,4.384236907958984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,1,power_law_1.01,5.52435188293457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,1,power_law_1.2,0.07980160117149353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,1,power_law_1.2,0.10131200551986694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,1,power_law_1.01,7.944678497314453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,1,power_law_1.2,0.12137600183486938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,1,power_law_1.2,0.2092479944229126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,1,power_law_1.01,19.84851837158203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,1,power_law_1.2,0.20841600894927978
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,1,power_law_1.2,0.21052799224853516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,1,power_law_1.2,0.21496961116790772
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,1,power_law_1.2,0.21701760292053224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,1,power_law_1.2,0.21906559467315673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,1,power_law_1.2,0.2199104070663452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,1,power_law_1.2,0.22501120567321778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,1,power_law_1.2,0.24097919464111328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,1,power_law_1.2,0.23894400596618653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,1,power_law_1.2,0.24364159107208253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,1,power_law_1.2,0.2618688106536865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,1,power_law_1.2,0.2817471981048584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,1,power_law_1.2,0.2891135931015015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,1,power_law_1.2,0.345632004737854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,1,power_law_1.2,0.3975872039794922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,1,power_law_1.2,0.5047616004943848
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,1,power_law_1.2,0.6153600215911865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,1,power_law_1.2,0.8392127990722656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,1,power_law_1.2,1.0597760200500488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,1,power_law_1.2,1.5129280090332031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,1,power_law_1.2,1.9969087600708009
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,1,power_law_1.2,3.076576042175293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,1,power_law_1.2,4.4187969207763675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,1,power_law_1.2,5.661766433715821
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,1,power_law_1.2,9.412908935546875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,1,power_law_1.2,19.18865966796875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,4,power_law_1.01,0.16803200244903566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,4,power_law_1.01,0.270630407333374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,4,power_law_1.01,0.21595520973205568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,4,power_law_1.01,0.21943039894104005
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,4,power_law_1.01,0.33575680255889895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,4,power_law_1.2,0.16766079664230346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,4,power_law_1.01,0.45966081619262694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,4,power_law_1.2,0.2653503894805908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,4,power_law_1.01,0.6124415874481202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,4,power_law_1.2,0.134278404712677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,4,power_law_1.01,0.6156479835510253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,4,power_law_1.2,0.19776639938354493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,4,power_law_1.01,0.6667200088500976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,4,power_law_1.2,0.3288383960723877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,4,power_law_1.01,0.6917056083679199
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,4,power_law_1.01,0.6818687915802002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,4,power_law_1.2,0.3996351957321167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,4,power_law_1.01,0.7158720016479492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,4,power_law_1.2,0.5907584190368652
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,4,power_law_1.01,0.7257023811340332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,4,power_law_1.2,0.5358975887298584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,4,power_law_1.01,0.7162816047668457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,4,power_law_1.2,0.6556992053985595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,4,power_law_1.01,0.7687104225158692
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,4,power_law_1.2,0.6823296070098877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,4,power_law_1.01,0.795743989944458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,4,power_law_1.2,0.6692031860351563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,4,power_law_1.01,0.809267234802246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,4,power_law_1.2,0.6941952228546142
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,4,power_law_1.01,0.8424320220947266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,4,power_law_1.2,0.7211647987365722
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,4,power_law_1.01,0.8801152229309082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,4,power_law_1.2,0.7798143863677979
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,4,power_law_1.01,0.9632384300231933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,4,power_law_1.2,0.7798143863677979
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,4,power_law_1.01,1.046828842163086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,4,power_law_1.2,0.8129792213439941
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,4,power_law_1.01,1.2362496376037597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,4,power_law_1.2,0.8482048034667968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,4,power_law_1.01,1.3525759696960449
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,4,power_law_1.2,0.904319953918457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,4,power_law_1.01,1.8602815628051759
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,4,power_law_1.2,0.9731391906738281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,4,power_law_1.01,2.2590208053588867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,4,power_law_1.2,1.0912896156311036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,4,power_law_1.2,1.1613375663757324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,4,power_law_1.01,3.0106367111206054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,4,power_law_1.2,1.3120767593383789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,4,power_law_1.01,4.02911376953125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,4,power_law_1.2,1.5289728164672851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,4,power_law_1.01,5.425171279907227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,4,power_law_1.2,2.057542419433594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,4,power_law_1.01,8.419615936279296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,4,power_law_1.2,2.391513633728027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,4,power_law_1.2,3.5943679809570312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,4,power_law_1.01,17.267135620117188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,4,power_law_1.2,3.9773441314697267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,4,power_law_1.2,5.041843032836914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,4,power_law_1.2,10.776025390625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,4,power_law_1.2,22.963967895507814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,2,power_law_1.01,0.11148799657821655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,2,power_law_1.01,0.16412800550460815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,2,power_law_1.01,0.131769597530365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,2,power_law_1.01,0.2239232063293457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,2,power_law_1.01,0.3150592088699341
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,2,power_law_1.01,0.4303743839263916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,2,power_law_1.01,0.6005568027496337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,2,power_law_1.01,0.625542402267456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,2,power_law_1.01,0.6556479930877686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,2,power_law_1.01,0.7211391925811768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,2,power_law_1.01,0.7019328117370606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,2,power_law_1.01,0.7183167934417725
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,2,power_law_1.01,0.7314176082611084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,2,power_law_1.01,0.7658304214477539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,2,power_law_1.01,0.7854911804199218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,2,power_law_1.01,0.7809792041778565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,2,power_law_1.01,0.822316837310791
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,2,power_law_1.01,0.8829695701599121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,2,power_law_1.01,0.9354047775268555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,2,power_law_1.01,1.0091263771057128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,2,power_law_1.01,1.0675071716308593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,2,power_law_1.01,1.2428159713745117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,2,power_law_1.2,0.11359360218048095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,2,power_law_1.01,1.4805760383605957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,2,power_law_1.2,0.165830397605896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,2,power_law_1.2,0.12711039781570435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,2,power_law_1.01,1.827507209777832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,2,power_law_1.2,0.20616960525512695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,2,power_law_1.01,2.2188800811767577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,2,power_law_1.2,0.29155840873718264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,2,power_law_1.01,3.012281608581543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,2,power_law_1.2,0.385152006149292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,2,power_law_1.01,3.650009536743164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,2,power_law_1.2,0.5825920104980469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,2,power_law_1.2,0.6231552124023437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,2,power_law_1.01,4.381375885009765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,2,power_law_1.2,0.6421823978424073
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,2,power_law_1.01,7.660626983642578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,2,power_law_1.2,0.6782336235046387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,2,power_law_1.2,0.6864255905151367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,2,power_law_1.01,17.32575378417969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,2,power_law_1.2,0.7224703788757324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,2,power_law_1.2,0.7540031909942627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,2,power_law_1.2,0.7925119876861573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,2,power_law_1.2,0.7945536136627197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,2,power_law_1.2,0.8199616432189941
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,2,power_law_1.2,0.8699199676513671
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,2,power_law_1.2,0.9297344207763671
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,2,power_law_1.2,1.025158405303955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,2,power_law_1.2,1.116703987121582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,2,power_law_1.2,1.1306112289428711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,2,power_law_1.2,1.3563455581665038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,2,power_law_1.2,1.524396800994873
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,2,power_law_1.2,1.9473791122436523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,2,power_law_1.2,2.4214847564697264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,2,power_law_1.2,3.1624639511108397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,2,power_law_1.2,3.9851329803466795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,2,power_law_1.2,4.921267318725586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,2,power_law_1.2,9.01952667236328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,2,power_law_1.2,19.202394104003908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,1,power_law_1.01,0.09224960207939148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,1,power_law_1.01,0.11559679508209228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,1,power_law_1.01,0.1319808006286621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,1,power_law_1.01,0.22578558921813965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,1,power_law_1.01,0.3281599998474121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,1,power_law_1.01,0.4260672092437744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,4,power_law_1.01,0.08343679904937744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,1,power_law_1.01,0.5972928047180176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,4,power_law_1.01,0.06889600157737732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,1,power_law_1.2,0.08799359798431397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,1,power_law_1.01,0.6564799785614014
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,4,power_law_1.01,0.07360640168190002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,1,power_law_1.2,0.11706880331039429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,1,power_law_1.01,0.6630144119262695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,4,power_law_1.01,0.10104960203170776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,1,power_law_1.2,0.12424319982528687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,4,power_law_1.01,0.12375680208206177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,1,power_law_1.01,0.6925055980682373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,1,power_law_1.2,0.20103681087493896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,4,power_law_1.01,0.18563200235366822
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,1,power_law_1.01,0.7154560089111328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,1,power_law_1.2,0.2868607997894287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,4,power_law_1.01,0.19136639833450317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,1,power_law_1.01,0.7371583938598633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,4,power_law_1.01,0.19587199687957763
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,1,power_law_1.2,0.38474240303039553
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,1,power_law_1.01,0.7559936046600342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,4,power_law_1.01,0.2028287887573242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,1,power_law_1.2,0.5969151973724365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,1,power_law_1.01,0.789574384689331
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,4,power_law_1.01,0.20734720230102538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,1,power_law_1.01,0.7944896221160889
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,1,power_law_1.2,0.6202688217163086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,4,power_law_1.01,0.20918400287628175
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,1,power_law_1.01,0.8256192207336426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,1,power_law_1.2,0.6556928157806396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,4,power_law_1.01,0.20733439922332764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,1,power_law_1.01,0.8743743896484375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,1,power_law_1.2,0.6806719779968262
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,4,power_law_1.01,0.21429119110107422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,1,power_law_1.01,0.9972543716430664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,1,power_law_1.2,0.7331136226654053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,4,power_law_1.01,0.2169663906097412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,1,power_law_1.01,0.9829312324523926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,4,power_law_1.01,0.22618238925933837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,1,power_law_1.2,0.7380224227905273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,1,power_law_1.01,1.1301823616027833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,4,power_law_1.01,0.2278208017349243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,1,power_law_1.2,0.769977617263794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,4,power_law_1.01,0.24072959423065185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,1,power_law_1.01,1.215379238128662
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,1,power_law_1.2,0.7818560123443603
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,4,power_law_1.01,0.2726720094680786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,1,power_law_1.01,1.441875171661377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,1,power_law_1.2,0.8166655540466309
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,4,power_law_1.01,0.28945279121398926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,1,power_law_1.01,1.6419776916503905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,1,power_law_1.2,0.8621312141418457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,4,power_law_1.01,0.3064703941345215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,4,power_law_1.2,0.08287360072135926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,1,power_law_1.01,2.103596878051758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,1,power_law_1.2,0.9305343627929688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,4,power_law_1.01,0.3789695978164673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,4,power_law_1.2,0.05726720094680786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,1,power_law_1.01,2.6131263732910157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,1,power_law_1.2,1.050540828704834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,4,power_law_1.01,0.4662015914916992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,4,power_law_1.2,0.06340479850769043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,1,power_law_1.2,1.0301055908203125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,1,power_law_1.01,3.538412857055664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,4,power_law_1.2,0.09660800099372864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,4,power_law_1.01,0.5505792140960694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,1,power_law_1.2,1.1818304061889648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,4,power_law_1.2,0.11216000318527222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,4,power_law_1.01,0.7527296066284179
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,1,power_law_1.01,4.725632095336914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,4,power_law_1.2,0.18628480434417724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,1,power_law_1.2,1.2551360130310059
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,4,power_law_1.01,0.8940352439880371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,1,power_law_1.01,5.778105545043945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,4,power_law_1.2,0.19121919870376586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,1,power_law_1.2,1.4681280136108399
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,4,power_law_1.01,1.2759872436523438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,4,power_law_1.2,0.20145280361175538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,1,power_law_1.01,8.79849624633789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,1,power_law_1.2,1.7018239974975586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,4,power_law_1.01,1.6669183731079102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,4,power_law_1.2,0.2030911922454834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,4,power_law_1.2,0.21211519241333007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,1,power_law_1.2,2.1681215286254885
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,4,power_law_1.01,2.0144960403442385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,1,power_law_1.01,18.235667419433593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,4,power_law_1.2,0.21293439865112304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,1,power_law_1.2,2.6541248321533204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,4,power_law_1.01,3.4638526916503904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,4,power_law_1.2,0.22152318954467773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,1,power_law_1.2,3.5196094512939453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,4,power_law_1.2,0.23196160793304443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,4,power_law_1.01,7.500460815429688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,4,power_law_1.2,0.22152960300445557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,1,power_law_1.2,4.956083297729492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,4,power_law_1.2,0.23155839443206788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,1,power_law_1.2,6.046432113647461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,4,power_law_1.2,0.24303359985351564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,4,power_law_1.2,0.24159998893737794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,1,power_law_1.2,9.85736312866211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,4,power_law_1.2,0.27599999904632566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,4,power_law_1.2,0.29217278957366943
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,4,power_law_1.2,0.34113919734954834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,1,power_law_1.2,19.564877319335938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,4,power_law_1.2,0.39908480644226074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,4,power_law_1.2,0.4666751861572266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,4,power_law_1.2,0.608403205871582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,4,power_law_1.2,0.8678848266601562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,4,power_law_1.2,0.9776512145996094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,4,power_law_1.2,1.5912256240844727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,4,power_law_1.2,2.1632320404052736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,4,power_law_1.2,2.6442943572998048
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,4,power_law_1.2,4.450848007202149
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,4,power_law_1.2,11.286809539794922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,2,power_law_1.01,0.061318397521972656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,2,power_law_1.01,0.056409597396850586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,2,power_law_1.01,0.0705407977104187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,2,power_law_1.01,0.09757440090179444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,2,power_law_1.2,0.060102397203445436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,2,power_law_1.01,0.13423360586166383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,2,power_law_1.2,0.05106559991836548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,2,power_law_1.01,0.18480639457702636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,2,power_law_1.2,0.0650111973285675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,2,power_law_1.01,0.18828799724578857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,2,power_law_1.2,0.09962239861488342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,2,power_law_1.01,0.19750399589538575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,2,power_law_1.2,0.11703039407730102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,2,power_law_1.01,0.20611839294433593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,2,power_law_1.2,0.1860352039337158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,2,power_law_1.01,0.2089792013168335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,2,power_law_1.01,0.2083712100982666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,2,power_law_1.2,0.1991487979888916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,2,power_law_1.01,0.21656959056854247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,2,power_law_1.2,0.20529279708862305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,2,power_law_1.01,0.22231678962707518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,2,power_law_1.2,0.2075455904006958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,2,power_law_1.01,0.2231231927871704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,2,power_law_1.2,0.21020801067352296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,2,power_law_1.01,0.23520638942718505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,2,power_law_1.2,0.2163520097732544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,2,power_law_1.01,0.239302396774292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,2,power_law_1.2,0.21797759532928468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,2,power_law_1.01,0.2534208059310913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,2,power_law_1.2,0.22597761154174806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,1,power_law_1.01,0.04211840033531189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,2,power_law_1.01,0.28167679309844973
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,2,power_law_1.2,0.22780799865722656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,1,power_law_1.01,0.052774399518966675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,2,power_law_1.01,0.2943487882614136
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,2,power_law_1.2,0.23928959369659425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,1,power_law_1.01,0.0732479989528656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,2,power_law_1.01,0.3435456037521362
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,2,power_law_1.2,0.24911999702453613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,1,power_law_1.01,0.10028799772262573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,2,power_law_1.01,0.40189437866210936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,2,power_law_1.2,0.2544447898864746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,1,power_law_1.01,0.12750719785690307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,2,power_law_1.01,0.4805439949035645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,2,power_law_1.2,0.2927488088607788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,1,power_law_1.01,0.19264639616012574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,2,power_law_1.01,0.5628672122955323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,2,power_law_1.2,0.3013375997543335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,1,power_law_1.01,0.1998080015182495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,2,power_law_1.01,0.7613311767578125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,2,power_law_1.2,0.3568448066711426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,1,power_law_1.01,0.21128320693969727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,2,power_law_1.01,0.938265609741211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,2,power_law_1.2,0.4178624153137207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,1,power_law_1.01,0.21415040493011475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,2,power_law_1.01,1.3525888442993164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,1,power_law_1.01,0.21762559413909913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,2,power_law_1.2,0.48954238891601565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,2,power_law_1.01,1.6632640838623047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,1,power_law_1.2,0.04540160000324249
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,1,power_law_1.01,0.22684800624847412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,2,power_law_1.2,0.5907135963439941
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,1,power_law_1.2,0.05358719825744629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,2,power_law_1.01,2.1234624862670897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,1,power_law_1.01,0.2352447986602783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,2,power_law_1.2,0.8211263656616211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,1,power_law_1.2,0.06791679859161377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,2,power_law_1.01,3.2394176483154298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,1,power_law_1.01,0.23891839981079102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,2,power_law_1.2,1.035756778717041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,1,power_law_1.2,0.08759040236473084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,1,power_law_1.01,0.2471168041229248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,1,power_law_1.2,0.11176320314407348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,2,power_law_1.2,1.3402624130249023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,2,power_law_1.01,7.332537841796875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,1,power_law_1.01,0.26042881011962893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,1,power_law_1.2,0.19223040342330933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,2,power_law_1.2,1.8209535598754882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,1,power_law_1.01,0.2712640047073364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,1,power_law_1.2,0.20902400016784667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,2,power_law_1.2,2.2176511764526365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,1,power_law_1.01,0.2770303964614868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,1,power_law_1.2,0.21415040493011475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,1,power_law_1.01,0.32206718921661376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,1,power_law_1.2,0.21782400608062744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,2,power_law_1.2,3.426988983154297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,1,power_law_1.01,0.34869120121002195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,1,power_law_1.2,0.22295680046081542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,2,power_law_1.2,7.307334136962891
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,1,power_law_1.01,0.4261119842529297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,1,power_law_1.2,0.23688960075378418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,1,power_law_1.2,0.2495743989944458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,1,power_law_1.01,0.4564223766326904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,1,power_law_1.2,0.2506047964096069
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,1,power_law_1.01,0.5833983898162842
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,1,power_law_1.2,0.25389440059661866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,1,power_law_1.01,0.7200064182281494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,1,power_law_1.2,0.26574718952178955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,1,power_law_1.01,0.9547072410583496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,1,power_law_1.2,0.2780479907989502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,1,power_law_1.01,1.1769087791442872
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,1,power_law_1.2,0.28009600639343263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,1,power_law_1.01,1.6653631210327149
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,1,power_law_1.2,0.32476799488067626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,1,power_law_1.01,2.146015930175781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,1,power_law_1.2,0.3618112087249756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,1,power_law_1.01,2.6852800369262697
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,1,power_law_1.2,0.4318528175354004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,1,power_law_1.2,0.4650239944458008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,1,power_law_1.01,4.36748161315918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,1,power_law_1.2,0.6010176181793213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,1,power_law_1.2,0.7261504173278809
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,1,power_law_1.01,8.842098999023438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,1,power_law_1.2,0.9690431594848633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,1,power_law_1.2,1.210092830657959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,1,power_law_1.2,1.7001792907714843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,1,power_law_1.2,2.3104896545410156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,1,power_law_1.2,2.859552001953125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,1,power_law_1.2,4.505318450927734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,1,power_law_1.2,9.421075439453125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,4,power_law_1.01,0.17397119998931884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,4,power_law_1.01,0.19773440361022948
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,4,power_law_1.01,0.17970559597015381
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,4,power_law_1.01,0.21636478900909423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,4,power_law_1.01,0.2931648015975952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,4,power_law_1.01,0.4641727924346924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,4,power_law_1.01,0.4813695907592773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,4,power_law_1.2,0.1745792031288147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,4,power_law_1.01,0.5157695770263672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,4,power_law_1.2,0.12993919849395752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,4,power_law_1.01,0.5378943920135498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,4,power_law_1.01,0.5182400226593018
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,4,power_law_1.2,0.1522495985031128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,4,power_law_1.01,0.5473216056823731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,4,power_law_1.2,0.1997696042060852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,4,power_law_1.01,0.5464960098266601
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,4,power_law_1.2,0.2931519985198975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,4,power_law_1.01,0.5542848110198975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,4,power_law_1.2,0.4797311782836914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,4,power_law_1.01,0.5796735763549805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,4,power_law_1.2,0.4719359874725342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,4,power_law_1.01,0.5960639953613281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,4,power_law_1.2,0.5255871772766113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,4,power_law_1.01,0.5993343830108643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,4,power_law_1.2,0.5407551765441895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,4,power_law_1.01,0.6210303783416748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,4,power_law_1.2,0.5419775962829589
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,4,power_law_1.01,0.6785920143127442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,4,power_law_1.2,0.5690176010131835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,4,power_law_1.01,0.7670720100402832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,4,power_law_1.2,0.5636928081512451
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,4,power_law_1.01,0.8919936180114746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,4,power_law_1.2,0.6013631820678711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,4,power_law_1.01,0.8752063751220703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,4,power_law_1.2,0.5903039932250976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,4,power_law_1.01,1.1432703971862792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,4,power_law_1.2,0.6243072032928467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,2,power_law_1.01,0.11562240123748779
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,4,power_law_1.01,1.3685503959655763
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,4,power_law_1.2,0.621452808380127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,2,power_law_1.01,0.14697599411010742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,4,power_law_1.01,1.7185535430908203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,2,power_law_1.01,0.13102079629898072
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,4,power_law_1.2,0.6600831985473633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,4,power_law_1.01,2.1660415649414064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,2,power_law_1.01,0.21763839721679687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,4,power_law_1.2,0.7736192226409913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,2,power_law_1.01,0.2868607997894287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,4,power_law_1.2,0.8354623794555665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,4,power_law_1.01,2.882374382019043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,2,power_law_1.01,0.4625728130340576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,4,power_law_1.2,0.9726655960083008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,4,power_law_1.01,4.098329544067383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,2,power_law_1.01,0.48428797721862793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,4,power_law_1.2,1.0517312049865724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,4,power_law_1.01,5.3940990447998045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,2,power_law_1.01,0.5006527900695801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,4,power_law_1.2,1.301375961303711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,2,power_law_1.2,0.11868799924850464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,2,power_law_1.01,0.5047679901123047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,4,power_law_1.01,8.842118072509766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,2,power_law_1.2,0.10417280197143555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,4,power_law_1.2,1.3877951622009277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,2,power_law_1.01,0.5334400177001953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,2,power_law_1.2,0.12302720546722412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,4,power_law_1.2,1.7619840621948242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,2,power_law_1.01,0.5571968078613281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,4,power_law_1.01,18.962112426757812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,2,power_law_1.2,0.19634560346603394
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,4,power_law_1.2,2.427168083190918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,2,power_law_1.01,0.5579967975616456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,2,power_law_1.2,0.26042881011962893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,4,power_law_1.2,3.2385791778564452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,2,power_law_1.01,0.559225606918335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,2,power_law_1.2,0.4593023777008057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,2,power_law_1.01,0.5612864017486572
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,2,power_law_1.2,0.4920639991760254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,4,power_law_1.2,4.392422485351562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,2,power_law_1.2,0.5121344089508056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,2,power_law_1.01,0.59650559425354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,4,power_law_1.2,6.509645080566406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,2,power_law_1.2,0.5305727958679199
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,2,power_law_1.01,0.6034687995910645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,2,power_law_1.2,0.5387519836425781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,2,power_law_1.01,0.6434112071990967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,4,power_law_1.2,12.135289764404297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,2,power_law_1.2,0.5625216007232666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,2,power_law_1.01,0.6966591835021972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,2,power_law_1.2,0.5518720149993896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,2,power_law_1.01,0.7658751964569092
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,4,power_law_1.2,26.120709228515626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,2,power_law_1.2,0.5764351844787597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,2,power_law_1.01,0.9235712051391601
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,2,power_law_1.2,0.5961023807525635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,2,power_law_1.01,0.9034432411193848
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,2,power_law_1.2,0.6010303974151612
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,2,power_law_1.01,1.1003071784973144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,2,power_law_1.2,0.6268223762512207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,2,power_law_1.01,1.2715264320373536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,2,power_law_1.2,0.6704512119293213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,2,power_law_1.01,1.6542911529541016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,2,power_law_1.2,0.745798397064209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,2,power_law_1.01,2.052230453491211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,2,power_law_1.2,0.8080639839172363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,2,power_law_1.01,2.724985694885254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,2,power_law_1.2,0.9649408340454102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,2,power_law_1.01,3.649260711669922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,2,power_law_1.2,0.9202303886413574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,2,power_law_1.2,1.139641571044922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,2,power_law_1.01,4.312607955932617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,2,power_law_1.2,1.406707191467285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,2,power_law_1.01,8.121689605712891
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,2,power_law_1.2,1.7198400497436523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,2,power_law_1.2,2.2323904037475586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,2,power_law_1.01,15.5214599609375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,2,power_law_1.2,3.0676223754882814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,2,power_law_1.2,4.486886215209961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,2,power_law_1.2,5.398566436767578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,2,power_law_1.2,9.438349151611328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,2,power_law_1.2,20.11328582763672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,1,power_law_1.01,0.08652160167694092
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,1,power_law_1.01,0.11027840375900269
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,1,power_law_1.01,0.13752959966659545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,1,power_law_1.01,0.21800320148468016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,1,power_law_1.01,0.2866111993789673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,1,power_law_1.01,0.45795202255249023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,1,power_law_1.01,0.48956799507141113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,1,power_law_1.01,0.5178304195404053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,1,power_law_1.01,0.5407487869262695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,1,power_law_1.01,0.5383103847503662
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,1,power_law_1.01,0.5608384132385253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,1,power_law_1.01,0.5731200218200684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,1,power_law_1.2,0.088128000497818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,1,power_law_1.01,0.5821248054504394
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,1,power_law_1.2,0.09838079810142517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,1,power_law_1.01,0.6087615966796875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,1,power_law_1.2,0.1340288043022156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,1,power_law_1.01,0.6288256168365478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,1,power_law_1.2,0.19586559534072875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,1,power_law_1.01,0.6499263763427734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,1,power_law_1.2,0.2556864023208618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,1,power_law_1.01,0.6781888008117676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,1,power_law_1.2,0.4571968078613281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,1,power_law_1.01,0.7580543994903565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,1,power_law_1.2,0.4965184211730957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,1,power_law_1.01,0.7986112117767334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,1,power_law_1.2,0.531334400177002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,1,power_law_1.01,0.9321344375610352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,1,power_law_1.2,0.5309311866760253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,1,power_law_1.01,0.9616191864013672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,1,power_law_1.2,0.5612224102020263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,4,power_law_1.01,0.16417280435562134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,1,power_law_1.01,1.1780672073364258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,1,power_law_1.2,0.5763967990875244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,4,power_law_1.01,0.26883199214935305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,1,power_law_1.01,1.4070591926574707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,1,power_law_1.2,0.5882815837860107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,1,power_law_1.2,0.5899072170257569
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,4,power_law_1.01,0.4887807846069336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,1,power_law_1.01,1.8135808944702148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,1,power_law_1.2,0.6185728073120117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,1,power_law_1.01,2.26231689453125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,4,power_law_1.01,0.22049920558929442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,1,power_law_1.2,0.6392576217651367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,1,power_law_1.01,3.1470272064208986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,4,power_law_1.01,0.3706239938735962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,1,power_law_1.2,0.6519616127014161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,1,power_law_1.01,4.427865600585937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,4,power_law_1.01,0.5280960083007813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,4,power_law_1.2,0.16745599508285522
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,1,power_law_1.2,0.6765439987182618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,4,power_law_1.01,0.6446400165557862
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,4,power_law_1.2,0.2653439998626709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,1,power_law_1.2,0.7691071987152099
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,4,power_law_1.01,0.7675199985504151
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,1,power_law_1.2,0.8248127937316895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,4,power_law_1.2,0.25265278816223147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,1,power_law_1.2,0.9505536079406738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,4,power_law_1.01,0.8512895584106446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,4,power_law_1.2,0.20882558822631836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,1,power_law_1.2,0.9743103981018066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,4,power_law_1.2,0.3407167911529541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,4,power_law_1.01,0.8936575889587403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,1,power_law_1.2,1.1870976448059083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,4,power_law_1.01,0.911680030822754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,4,power_law_1.2,0.478547191619873
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,1,power_law_1.2,1.414022445678711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,4,power_law_1.01,0.9493696212768554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,4,power_law_1.2,0.5702976226806641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,1,power_law_1.2,1.8369279861450196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,4,power_law_1.01,0.9600383758544921
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,4,power_law_1.2,0.7249279975891113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,1,power_law_1.2,2.2500160217285154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,4,power_law_1.01,0.9755904197692871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,4,power_law_1.2,0.8334464073181153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,1,power_law_1.2,3.1085248947143556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,4,power_law_1.2,0.7970111846923829
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,4,power_law_1.01,1.023532772064209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,1,power_law_1.2,4.55931510925293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,4,power_law_1.2,0.885478401184082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,4,power_law_1.01,1.0132736206054687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,1,power_law_1.2,5.706035232543945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,4,power_law_1.2,0.9370944023132324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,4,power_law_1.01,1.0708288192749023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,1,power_law_1.2,8.629727935791015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,4,power_law_1.2,0.9203071594238281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,4,power_law_1.01,1.1318464279174805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,4,power_law_1.2,0.9366847991943359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,4,power_law_1.01,1.1793791770935058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,1,power_law_1.2,19.042387390136717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,4,power_law_1.2,0.9379136085510253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,4,power_law_1.01,1.349779224395752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,4,power_law_1.2,1.0353983879089355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,4,power_law_1.01,1.4574272155761718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,4,power_law_1.2,1.086400032043457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,4,power_law_1.01,1.707961654663086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,4,power_law_1.2,1.150284767150879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,4,power_law_1.01,1.7517887115478517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,4,power_law_1.2,1.2346688270568849
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,4,power_law_1.01,2.0235519409179688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,4,power_law_1.2,1.3698368072509766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,4,power_law_1.01,2.5423295974731444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,4,power_law_1.2,1.6088384628295898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,4,power_law_1.01,3.305388641357422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,4,power_law_1.2,1.9145984649658203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,4,power_law_1.01,4.35560302734375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,4,power_law_1.2,1.8296127319335938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,4,power_law_1.01,5.246892929077148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,4,power_law_1.2,2.290617561340332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,4,power_law_1.01,8.657234954833985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,4,power_law_1.2,2.9189504623413085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,4,power_law_1.2,3.440972900390625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,4,power_law_1.01,18.706521606445314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,4,power_law_1.2,5.279878234863281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,4,power_law_1.2,6.2768512725830075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,4,power_law_1.2,9.628211212158202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,4,power_law_1.2,19.40953674316406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,1,power_law_1.01,5.484627151489258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,1,power_law_1.01,8.2504638671875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,1,power_law_1.01,18.042169189453126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,2,power_law_1.01,0.11598720550537109
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,2,power_law_1.01,0.16739840507507325
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,2,power_law_1.01,0.2681663990020752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,2,power_law_1.01,0.20734078884124757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,2,power_law_1.01,0.354803204536438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,2,power_law_1.01,0.5108479976654052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,2,power_law_1.01,0.5919616222381592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,2,power_law_1.01,0.792460823059082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,2,power_law_1.01,0.8596351623535157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,2,power_law_1.01,0.8432512283325195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,2,power_law_1.01,0.8981120109558105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,2,power_law_1.01,0.954252815246582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,2,power_law_1.01,0.9780032157897949
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,2,power_law_1.01,0.975551986694336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,2,power_law_1.01,1.0345279693603515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,2,power_law_1.01,1.0476351737976075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,2,power_law_1.2,0.11276160478591919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,2,power_law_1.01,1.0728256225585937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,2,power_law_1.2,0.16725120544433594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,2,power_law_1.01,1.1768575668334962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,2,power_law_1.2,0.20636160373687745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,2,power_law_1.01,1.1895551681518555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,2,power_law_1.2,0.2088320016860962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,2,power_law_1.01,1.3427647590637206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,2,power_law_1.2,0.3347775936126709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,2,power_law_1.01,1.434886360168457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,2,power_law_1.2,0.4482304096221924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,2,power_law_1.01,1.6714496612548828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,2,power_law_1.2,0.558835220336914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,2,power_law_1.01,1.6903039932250976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,2,power_law_1.2,0.7589183807373047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,2,power_law_1.01,2.1119680404663086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,2,power_law_1.2,0.7814464092254638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,2,power_law_1.01,2.524025535583496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,2,power_law_1.2,0.8203583717346191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,2,power_law_1.01,3.2553665161132814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,2,power_law_1.2,0.874022388458252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,2,power_law_1.01,4.630604934692383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,2,power_law_1.2,0.8944895744323731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,2,power_law_1.2,0.9645376205444336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,2,power_law_1.01,5.388358306884766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,1,power_law_1.01,0.09086080193519593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,2,power_law_1.2,0.9813183784484864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,2,power_law_1.01,8.182240295410157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,1,power_law_1.01,0.11585919857025147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,2,power_law_1.2,1.0259712219238282
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,1,power_law_1.01,0.1729920029640198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,2,power_law_1.2,1.0321279525756837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,2,power_law_1.01,16.741049194335936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,1,power_law_1.01,0.20432639122009277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,2,power_law_1.2,1.0953920364379883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,1,power_law_1.01,0.3525887966156006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,2,power_law_1.2,1.1654335975646972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,1,power_law_1.01,0.5276991844177246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,2,power_law_1.2,1.248192024230957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,1,power_law_1.01,0.5952767848968505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,2,power_law_1.2,1.4262911796569824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,1,power_law_1.01,0.802342414855957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,2,power_law_1.2,1.4785792350769043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,1,power_law_1.01,0.8125823974609375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,2,power_law_1.2,1.7231103897094726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,1,power_law_1.01,0.8924544334411622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,2,power_law_1.2,1.8607295989990233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,1,power_law_1.01,0.9252160072326661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,2,power_law_1.2,2.3072063446044924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,1,power_law_1.01,0.955942440032959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,2,power_law_1.2,2.7424127578735353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,1,power_law_1.01,0.9682175636291503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,2,power_law_1.2,3.5915008544921876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,1,power_law_1.01,1.0071295738220214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,2,power_law_1.2,4.715865707397461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,1,power_law_1.01,1.038271999359131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,2,power_law_1.2,5.862527847290039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,1,power_law_1.01,1.0777983665466309
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,1,power_law_1.01,1.1441472053527832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,2,power_law_1.2,9.434854125976562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,1,power_law_1.01,1.2723584175109863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,1,power_law_1.01,1.3649279594421386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,2,power_law_1.2,20.810418701171876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,1,power_law_1.01,1.5546048164367676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,1,power_law_1.01,1.5547072410583496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,1,power_law_1.01,1.8315967559814452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,1,power_law_1.01,2.117350387573242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,1,power_law_1.01,2.6319488525390624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,1,power_law_1.01,3.066815948486328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,1,power_law_1.01,3.985273742675781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,1,power_law_1.01,5.2454784393310545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,1,power_law_1.01,6.31446418762207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,1,power_law_1.01,9.55159683227539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,1,power_law_1.01,19.527615356445313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,4,power_law_1.01,0.09408000111579895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,4,power_law_1.01,0.07790079712867737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,4,power_law_1.01,0.08773120045661927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,4,power_law_1.01,0.09305599927902222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,4,power_law_1.01,0.09326080083847046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,4,power_law_1.01,0.09528959989547729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,4,power_law_1.01,0.09633280038833618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,4,power_law_1.01,0.09837440252304078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,4,power_law_1.01,0.09960960149765015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,4,power_law_1.01,0.10576640367507935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,4,power_law_1.01,0.10658559799194336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,4,power_law_1.01,0.1102720022201538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,4,power_law_1.01,0.11681920289993286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,4,power_law_1.01,0.1340288043022156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,4,power_law_1.01,0.14405759572982788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,4,power_law_1.01,0.1549056053161621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,4,power_law_1.01,0.16309759616851807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,4,power_law_1.01,0.2081536054611206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,4,power_law_1.01,0.2751039981842041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,4,power_law_1.01,0.34434559345245364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,4,power_law_1.01,0.3930943965911865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,4,power_law_1.01,0.6818560123443603
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,4,power_law_1.01,0.7273215770721435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,4,power_law_1.01,0.9427776336669922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,4,power_law_1.01,1.5063872337341309
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,4,power_law_1.01,2.0144895553588866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,4,power_law_1.01,3.416767883300781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,4,power_law_1.01,3.5437313079833985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,4,power_law_1.2,0.11932159662246704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,4,power_law_1.01,6.488543701171875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,4,power_law_1.2,0.08307200074195861
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,4,power_law_1.2,0.08737919926643371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,4,power_law_1.01,16.220851135253906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,4,power_law_1.2,0.09168639779090881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,4,power_law_1.2,0.09208959937095643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,4,power_law_1.2,0.0937279999256134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,4,power_law_1.2,0.09537919759750366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,4,power_law_1.2,0.09617919921875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,4,power_law_1.2,0.09741439819335937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,4,power_law_1.2,0.10314879417419434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,4,power_law_1.2,0.10765440464019775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,4,power_law_1.2,0.1121664047241211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,4,power_law_1.2,0.11461759805679321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,4,power_law_1.2,0.11891839504241944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,4,power_law_1.2,0.1477952003479004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,4,power_law_1.2,0.14370559453964232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,4,power_law_1.2,0.18090239763259888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,4,power_law_1.2,0.210265588760376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,4,power_law_1.2,0.2645312070846558
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,4,power_law_1.2,0.3274048089981079
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,2,power_law_1.01,0.05748479962348938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,4,power_law_1.2,0.4351232051849365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,2,power_law_1.01,0.06793599724769592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,4,power_law_1.2,0.5952832221984863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,2,power_law_1.01,0.06627839803695679
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,1,power_law_1.2,0.09388160109519958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,4,power_law_1.2,0.8813823699951172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,2,power_law_1.01,0.08615679740905761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,4,power_law_1.2,1.1916543960571289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,2,power_law_1.01,0.0877888023853302
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,1,power_law_1.2,0.11886719465255738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,2,power_law_1.01,0.09004160165786743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,4,power_law_1.2,1.5662336349487305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,1,power_law_1.2,0.14199039936065674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,2,power_law_1.01,0.0896511971950531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,4,power_law_1.2,2.3334144592285155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,2,power_law_1.01,0.09473919868469238
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,1,power_law_1.2,0.2065279960632324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,4,power_law_1.2,3.6853057861328127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,2,power_law_1.01,0.09782400131225585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,1,power_law_1.2,0.32468481063842775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,4,power_law_1.2,4.2548480987548825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,2,power_law_1.01,0.09742720127105713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,1,power_law_1.2,0.44982399940490725
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,2,power_law_1.01,0.10314879417419434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,4,power_law_1.2,7.651987457275391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,2,power_law_1.01,0.10643199682235718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,1,power_law_1.2,0.5407551765441895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,2,power_law_1.01,0.10766079425811767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,4,power_law_1.2,18.22406463623047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,2,power_law_1.01,0.11380480527877808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,1,power_law_1.2,0.7780672073364258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,2,power_law_1.01,0.12773120403289795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,1,power_law_1.2,0.8174336433410645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,2,power_law_1.01,0.13468799591064454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,2,power_law_1.01,0.15066239833831788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,1,power_law_1.2,0.8407999992370605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,2,power_law_1.01,0.19570560455322267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,1,power_law_1.2,0.8866496086120605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,2,power_law_1.01,0.20266880989074706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,2,power_law_1.01,0.27150719165802
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,1,power_law_1.2,0.9321215629577637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,2,power_law_1.01,0.2911616086959839
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,1,power_law_1.2,0.9607935905456543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,2,power_law_1.01,0.42182397842407227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,2,power_law_1.01,0.4871551990509033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,1,power_law_1.2,1.025932788848877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,2,power_law_1.01,0.7372159957885742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,1,power_law_1.2,1.044364833831787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,2,power_law_1.01,0.9980799674987793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,1,power_law_1.2,1.076531219482422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,2,power_law_1.01,1.5703231811523437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,2,power_law_1.01,1.9007040023803712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,1,power_law_1.2,1.1527104377746582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,2,power_law_1.01,2.7641088485717775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,1,power_law_1.2,1.3046272277832032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,2,power_law_1.2,0.060288000106811526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,2,power_law_1.01,4.075046539306641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,1,power_law_1.2,1.3939647674560547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,2,power_law_1.2,0.0674560010433197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,2,power_law_1.01,7.883699035644531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,2,power_law_1.2,0.07441920042037964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,1,power_law_1.2,1.638688087463379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,2,power_law_1.2,0.08773760199546814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,2,power_law_1.2,0.09015039801597595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,1,power_law_1.2,1.6083776473999023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,2,power_law_1.2,0.09428480267524719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,1,power_law_1.2,1.9120960235595703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,2,power_law_1.2,0.09448959827423095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,2,power_law_1.2,0.0967423975467682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,1,power_law_1.2,2.2176511764526365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,2,power_law_1.2,0.09591680169105529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,2,power_law_1.2,0.10083839893341065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,1,power_law_1.2,2.7382528305053713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,2,power_law_1.2,0.1033087968826294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,1,power_law_1.2,3.061030387878418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,2,power_law_1.2,0.1059648036956787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,2,power_law_1.2,0.10534399747848511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,1,power_law_1.2,4.022963333129883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,2,power_law_1.2,0.10707199573516846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,2,power_law_1.2,0.12337919473648071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,1,power_law_1.2,5.3699390411376955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,2,power_law_1.2,0.12951040267944336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,2,power_law_1.2,0.14487040042877197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,1,power_law_1.2,6.483634948730469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,2,power_law_1.2,0.1794816017150879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,2,power_law_1.2,0.20385279655456542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,1,power_law_1.2,9.847686767578125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,2,power_law_1.2,0.22864000797271727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,2,power_law_1.2,0.3203775882720947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,2,power_law_1.2,0.44854397773742677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,1,power_law_1.2,19.824922180175783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,2,power_law_1.2,0.4911935806274414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,2,power_law_1.2,0.7338816165924072
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,2,power_law_1.2,1.1133824348449708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,2,power_law_1.2,1.4610560417175293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,2,power_law_1.2,2.1537664413452147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,2,power_law_1.2,2.6557119369506834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,1,power_law_1.01,0.04539520144462585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,2,power_law_1.2,4.387897491455078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,1,power_law_1.01,0.051948797702789304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,1,power_law_1.01,0.06034560203552246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,2,power_law_1.2,8.749139404296875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,1,power_law_1.01,0.0830784022808075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,1,power_law_1.01,0.08636800050735474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,1,power_law_1.01,0.08840320110321045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,1,power_law_1.01,0.08792960047721862
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,1,power_law_1.01,0.08963199853897094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,1,power_law_1.01,0.09167360067367554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,1,power_law_1.01,0.09188479781150818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,1,power_law_1.01,0.09405440092086792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,1,power_law_1.01,0.09659519791603088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,1,power_law_1.01,0.09742079973220825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,1,power_law_1.01,0.10267519950866699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,1,power_law_1.01,0.114956796169281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,1,power_law_1.01,0.11953279972076417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,1,power_law_1.01,0.12936320304870605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,1,power_law_1.01,0.15168639421463012
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,1,power_law_1.01,0.17404799461364745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,1,power_law_1.01,0.21619839668273927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,1,power_law_1.01,0.25880320072174073
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,1,power_law_1.2,0.04580479860305786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,1,power_law_1.01,0.3382591962814331
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,1,power_law_1.2,0.057683199644088745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,1,power_law_1.01,0.4148543834686279
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,1,power_law_1.2,0.0624064028263092
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,1,power_law_1.01,0.5858687877655029
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,1,power_law_1.2,0.08432000279426574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,1,power_law_1.01,0.7429440021514893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,1,power_law_1.2,0.08553599715232849
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,1,power_law_1.2,0.08739200234413147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,1,power_law_1.01,1.0700160026550294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,1,power_law_1.2,0.08882560133934021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,1,power_law_1.01,1.4091520309448242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,1,power_law_1.2,0.0904640018939972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,1,power_law_1.01,1.7808704376220703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,1,power_law_1.2,0.09415040016174317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,1,power_law_1.01,2.896806335449219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,1,power_law_1.2,0.09414399862289428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,1,power_law_1.2,0.09333119988441467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,1,power_law_1.01,6.122828674316406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,1,power_law_1.2,0.09673600196838379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,1,power_law_1.2,0.09905920028686524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,1,power_law_1.2,0.10417280197143555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,1,power_law_1.2,0.11708799600601197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,1,power_law_1.2,0.11707520484924316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,1,power_law_1.2,0.12896000146865844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,1,power_law_1.2,0.15251200199127196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,1,power_law_1.2,0.17196799516677858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,1,power_law_1.2,0.22193920612335205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,1,power_law_1.2,0.2592128038406372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,1,power_law_1.2,0.3429759979248047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,1,power_law_1.2,0.4246848106384277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,1,power_law_1.2,0.5940608024597168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,1,power_law_1.2,0.7605311870574951
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,1,power_law_1.2,1.0958208084106444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,1,power_law_1.2,1.4570560455322266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,1,power_law_1.2,1.8414272308349608
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,1,power_law_1.2,3.2496257781982423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,1,power_law_1.2,6.295686340332031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,4,power_law_1.01,0.15820159912109374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,4,power_law_1.01,0.1074112057685852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,4,power_law_1.01,0.11273599863052368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,4,power_law_1.01,0.1307584047317505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,4,power_law_1.01,0.1307584047317505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,4,power_law_1.01,0.13362560272216797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,4,power_law_1.01,0.13485440015792846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,4,power_law_1.01,0.13771519660949708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,4,power_law_1.01,0.13772159814834595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,4,power_law_1.2,0.1352255940437317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,4,power_law_1.01,0.1426367998123169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,4,power_law_1.2,0.13768320083618163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,4,power_law_1.01,0.14243839979171752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,4,power_law_1.2,0.11190400123596192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,4,power_law_1.01,0.14897279739379882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,4,power_law_1.2,0.13157119750976562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,4,power_law_1.01,0.16167680025100709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,4,power_law_1.2,0.13032959699630736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,4,power_law_1.01,0.18213759660720824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,4,power_law_1.2,0.13236479759216307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,4,power_law_1.01,0.20181760787963868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,4,power_law_1.2,0.1360640048980713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,4,power_law_1.01,0.2517888069152832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,4,power_law_1.2,0.1372928023338318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,4,power_law_1.01,0.22906880378723143
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,4,power_law_1.01,0.27370240688323977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,4,power_law_1.2,0.14396159648895263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,4,power_law_1.01,0.37445759773254395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,4,power_law_1.2,0.148364794254303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,4,power_law_1.01,0.45569920539855957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,4,power_law_1.2,0.14261759519577027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,4,power_law_1.01,0.7117760181427002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,4,power_law_1.2,0.15407999753952026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,4,power_law_1.2,0.16289279460906983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,4,power_law_1.01,0.998476791381836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,4,power_law_1.2,0.17396479845046997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,4,power_law_1.01,1.243622398376465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,4,power_law_1.2,0.2081536054611206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,4,power_law_1.01,1.7009599685668946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,4,power_law_1.2,0.24174079895019532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,4,power_law_1.01,2.5455360412597656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,4,power_law_1.2,0.2425600051879883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,4,power_law_1.01,2.9115135192871096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,4,power_law_1.2,0.3199680089950562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,4,power_law_1.01,5.62224006652832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,4,power_law_1.2,0.3623487949371338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,4,power_law_1.01,6.619001770019532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,4,power_law_1.2,0.509222412109375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,4,power_law_1.2,0.587443208694458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,4,power_law_1.01,14.132722473144531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,4,power_law_1.2,0.953433609008789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,4,power_law_1.2,1.2051263809204102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,4,power_law_1.2,1.961248016357422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,4,power_law_1.01,30.259506225585938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,4,power_law_1.2,2.2938304901123048
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,2,power_law_1.01,0.07324159741401673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,4,power_law_1.2,3.699590301513672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,2,power_law_1.01,0.08676480054855347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,2,power_law_1.01,0.08450559973716736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,4,power_law_1.2,6.55633316040039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,2,power_law_1.01,0.12977919578552247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,4,power_law_1.2,6.493459320068359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,2,power_law_1.01,0.12198400497436523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,2,power_law_1.01,0.12854399681091308
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,4,power_law_1.2,12.162751770019531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,2,power_law_1.01,0.12976640462875366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,2,power_law_1.01,0.13223040103912354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,4,power_law_1.2,21.479930114746093
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,2,power_law_1.01,0.13715200424194335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,2,power_law_1.01,0.14042240381240845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,2,power_law_1.01,0.14369920492172242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,2,power_law_1.01,0.14902399778366088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,2,power_law_1.01,0.1550976037979126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,2,power_law_1.01,0.15598080158233643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,2,power_law_1.01,0.1828160047531128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,2,power_law_1.01,0.1842560052871704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,2,power_law_1.01,0.20186240673065187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,2,power_law_1.01,0.24159998893737794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,2,power_law_1.01,0.2985152006149292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,2,power_law_1.2,0.07734400033950806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,2,power_law_1.01,0.37511680126190183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,2,power_law_1.2,0.07284479737281799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,2,power_law_1.01,0.43349761962890626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,2,power_law_1.2,0.08513919711112976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,2,power_law_1.01,0.6835584163665771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,2,power_law_1.2,0.1273151993751526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,2,power_law_1.01,0.9522496223449707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,2,power_law_1.2,0.12711679935455322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,2,power_law_1.01,1.4193984031677247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,2,power_law_1.2,0.12896640300750734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,2,power_law_1.01,1.523641586303711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,2,power_law_1.2,0.12917120456695558
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,2,power_law_1.01,2.502579116821289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,2,power_law_1.2,0.13736319541931152
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,2,power_law_1.01,3.776633453369141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,2,power_law_1.2,0.1424831986427307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,2,power_law_1.01,4.721184158325196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,2,power_law_1.2,0.14678399562835692
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,2,power_law_1.2,0.13979519605636598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,2,power_law_1.01,7.021478271484375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,2,power_law_1.2,0.15107840299606323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,2,power_law_1.2,0.1559872031211853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,2,power_law_1.01,17.26275177001953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,2,power_law_1.2,0.1588544011116028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,2,power_law_1.2,0.18138240575790404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,2,power_law_1.2,0.1924415946006775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,2,power_law_1.2,0.20514559745788574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,2,power_law_1.2,0.24078080654144288
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,2,power_law_1.2,0.31449599266052247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,2,power_law_1.2,0.4070720195770264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,2,power_law_1.2,0.47322878837585447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,2,power_law_1.2,0.6815167903900147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,2,power_law_1.2,0.6962560176849365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,2,power_law_1.2,1.3288703918457032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,2,power_law_1.2,1.5912256240844727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,2,power_law_1.2,2.5755008697509765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,2,power_law_1.2,3.709446334838867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,2,power_law_1.2,4.14384651184082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,2,power_law_1.2,8.3700927734375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,2,power_law_1.2,15.446925354003906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,1,power_law_1.01,0.0586624026298523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,1,power_law_1.01,0.06931840181350708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,1,power_law_1.01,0.09389439821243287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,1,power_law_1.01,0.1220736026763916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,1,power_law_1.01,0.12092800140380859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,1,power_law_1.01,0.12625279426574706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,1,power_law_1.01,0.12911360263824462
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,1,power_law_1.01,0.131167995929718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,1,power_law_1.01,0.1332159996032715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,1,power_law_1.01,0.13301119804382325
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,1,power_law_1.2,0.05824000239372253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,1,power_law_1.01,0.1354688048362732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,1,power_law_1.2,0.07132160067558288
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,1,power_law_1.01,0.13607679605484008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,1,power_law_1.2,0.08364800214767457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,1,power_law_1.01,0.1414080023765564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,1,power_law_1.2,0.1217344045639038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,1,power_law_1.01,0.1493888020515442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,1,power_law_1.2,0.12437759637832642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,1,power_law_1.01,0.16556799411773682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,1,power_law_1.2,0.12541439533233642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,1,power_law_1.01,0.17130240201950073
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,1,power_law_1.2,0.1270591974258423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,4,power_law_1.01,0.12588160037994384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,1,power_law_1.01,0.18439040184020997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,1,power_law_1.2,0.1286911964416504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,4,power_law_1.01,0.1647744059562683
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,1,power_law_1.01,0.21878399848937988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,1,power_law_1.2,0.12972160577774047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,4,power_law_1.01,0.11216000318527222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,1,power_law_1.01,0.2542527914047241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,1,power_law_1.2,0.13483519554138185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,1,power_law_1.01,0.30954880714416505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,1,power_law_1.2,0.1350335955619812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,4,power_law_1.01,0.1449280023574829
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,1,power_law_1.01,0.37363200187683104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,1,power_law_1.2,0.13728640079498292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,4,power_law_1.01,0.19960319995880127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,1,power_law_1.01,0.49898881912231446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,1,power_law_1.2,0.1391167998313904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,4,power_law_1.01,0.2479423999786377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,1,power_law_1.01,0.6185664176940918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,1,power_law_1.2,0.1503999948501587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,1,power_law_1.2,0.16494079828262329
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,1,power_law_1.01,0.8780608177185059
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,4,power_law_1.01,0.3290431976318359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,1,power_law_1.2,0.1737280011177063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,1,power_law_1.01,1.123200035095215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,4,power_law_1.01,0.35525760650634763
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,1,power_law_1.2,0.1835904002189636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,1,power_law_1.01,1.6669631958007813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,4,power_law_1.01,0.3659071922302246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,1,power_law_1.2,0.2184000015258789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,1,power_law_1.01,2.4050559997558594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,1,power_law_1.2,0.25156478881835936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,4,power_law_1.01,0.3630336046218872
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,1,power_law_1.01,2.9790975570678713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,1,power_law_1.2,0.3138432025909424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,4,power_law_1.01,0.38453121185302735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,1,power_law_1.01,4.584729766845703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,1,power_law_1.2,0.3709696054458618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,4,power_law_1.01,0.4033792018890381
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,1,power_law_1.2,0.5055359840393067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,4,power_law_1.2,0.10826879739761353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,1,power_law_1.01,9.513037109375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,1,power_law_1.2,0.6152959823608398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,4,power_law_1.01,0.4236480236053467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,4,power_law_1.2,0.15946240425109864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,1,power_law_1.2,0.8678144454956055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,4,power_law_1.01,0.4236608028411865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,4,power_law_1.2,0.09616000056266785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,1,power_law_1.2,1.1129664421081542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,4,power_law_1.01,0.435532808303833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,4,power_law_1.2,0.1375488042831421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,1,power_law_1.2,1.6349952697753907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,4,power_law_1.01,0.45150079727172854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,4,power_law_1.2,0.18381439447402953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,1,power_law_1.2,2.1996288299560547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,4,power_law_1.01,0.4719871997833252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,1,power_law_1.2,2.8201791763305666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,4,power_law_1.2,0.23052799701690674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,4,power_law_1.01,0.508454418182373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,1,power_law_1.2,4.456940841674805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,4,power_law_1.2,0.3319231986999512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,4,power_law_1.01,0.5346303939819336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,4,power_law_1.2,0.34101119041442873
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,1,power_law_1.2,9.375212860107421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,4,power_law_1.2,0.3634432077407837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,4,power_law_1.01,0.6157567977905274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,4,power_law_1.2,0.37553279399871825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,4,power_law_1.01,0.6437503814697265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,4,power_law_1.2,0.3882240056991577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,4,power_law_1.01,0.7702911853790283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,4,power_law_1.2,0.39969921112060547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,4,power_law_1.01,0.9321727752685547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,4,power_law_1.2,0.41648640632629397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,4,power_law_1.01,1.18919677734375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,4,power_law_1.2,0.4310463905334473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,4,power_law_1.01,1.4282879829406738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,4,power_law_1.2,0.4400383949279785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,4,power_law_1.01,1.9178815841674806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,4,power_law_1.2,0.4605247974395752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,4,power_law_1.01,2.5369792938232423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,4,power_law_1.2,0.4806079864501953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,4,power_law_1.01,3.098355293273926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,4,power_law_1.2,0.5248256206512452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,4,power_law_1.2,0.5649727821350098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,4,power_law_1.01,4.359711837768555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,4,power_law_1.2,0.6495552062988281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,4,power_law_1.2,0.6897024154663086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,4,power_law_1.01,9.691673278808594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,4,power_law_1.2,0.8232255935668945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,4,power_law_1.2,0.9485631942749023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,4,power_law_1.2,1.21212797164917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,4,power_law_1.2,1.4777600288391113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,4,power_law_1.2,2.02806396484375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,4,power_law_1.2,2.541062355041504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,4,power_law_1.2,3.27457275390625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,4,power_law_1.2,4.945369720458984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,4,power_law_1.2,11.907417297363281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,2,power_law_1.01,0.08570240139961242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,2,power_law_1.01,0.11600639820098876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,2,power_law_1.01,0.09717119932174682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,2,power_law_1.01,0.1401792049407959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,2,power_law_1.01,0.19629440307617188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,2,power_law_1.01,0.24564480781555176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,2,power_law_1.01,0.3419071912765503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,2,power_law_1.01,0.37262721061706544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,2,power_law_1.01,0.3605439901351929
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,2,power_law_1.2,0.08732159733772278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,2,power_law_1.01,0.3799999952316284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,2,power_law_1.2,0.11578880548477173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,2,power_law_1.01,0.4060031890869141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,2,power_law_1.2,0.09511039853096008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,2,power_law_1.01,0.4178880214691162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,2,power_law_1.2,0.1377087950706482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,2,power_law_1.01,0.4268799781799316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,2,power_law_1.2,0.17456640005111695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,2,power_law_1.01,0.4350912094116211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,2,power_law_1.2,0.23048319816589355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,2,power_law_1.01,0.45392642021179197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,2,power_law_1.2,0.3377919912338257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,2,power_law_1.01,0.46662402153015137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,2,power_law_1.2,0.35704960823059084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,2,power_law_1.01,0.4838143825531006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,2,power_law_1.2,0.3590912103652954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,2,power_law_1.01,0.5169919967651367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,2,power_law_1.2,0.3767103910446167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,2,power_law_1.01,0.5641151905059815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,2,power_law_1.2,0.4023104190826416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,2,power_law_1.01,0.6325056076049804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,2,power_law_1.2,0.40579838752746583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,2,power_law_1.01,0.7117760181427002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,2,power_law_1.2,0.43999361991882324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,2,power_law_1.01,0.8584128379821777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,2,power_law_1.2,0.440396785736084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,2,power_law_1.2,0.46005759239196775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,2,power_law_1.01,0.9672831535339356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,2,power_law_1.2,0.4682432174682617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,2,power_law_1.01,1.268607997894287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,2,power_law_1.2,0.5022463798522949
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,2,power_law_1.01,1.527289581298828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,2,power_law_1.2,0.5477183818817138
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,2,power_law_1.01,2.091436767578125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,2,power_law_1.2,0.5862143993377685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,2,power_law_1.01,2.729452705383301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,2,power_law_1.2,0.6564544200897217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,2,power_law_1.01,3.2619327545166015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,2,power_law_1.2,0.7318272113800048
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,2,power_law_1.01,5.187475204467773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,2,power_law_1.2,0.884614372253418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,2,power_law_1.2,1.0164992332458496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,1,power_law_1.01,0.07343999743461609
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,2,power_law_1.01,10.516146850585937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,2,power_law_1.2,1.2684032440185546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,1,power_law_1.01,0.09105920195579528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,2,power_law_1.2,1.5805184364318847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,1,power_law_1.01,0.1035647988319397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,1,power_law_1.01,0.15798399448394776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,2,power_law_1.2,2.1652223587036135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,1,power_law_1.01,0.21374080181121827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,2,power_law_1.2,2.8877695083618162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,1,power_law_1.01,0.2737344026565552
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,2,power_law_1.2,3.3176319122314455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,1,power_law_1.01,0.3697920083999634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,2,power_law_1.2,5.597267150878906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,1,power_law_1.01,0.3867775917053223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,1,power_law_1.01,0.4095295906066895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,2,power_law_1.2,11.933574676513672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,1,power_law_1.01,0.41422719955444337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,1,power_law_1.2,0.06976640224456787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,1,power_law_1.01,0.4347072124481201
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,1,power_law_1.2,0.09107199907302857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,1,power_law_1.01,0.4502719879150391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,1,power_law_1.2,0.10152319669723511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,1,power_law_1.01,0.45273599624633787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,1,power_law_1.2,0.14410879611968994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,1,power_law_1.01,0.5227839946746826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,1,power_law_1.2,0.18751360177993776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,1,power_law_1.01,0.5530879974365235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,1,power_law_1.2,0.2532671928405762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,1,power_law_1.01,0.5555456161499024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,1,power_law_1.2,0.3649087905883789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,1,power_law_1.01,0.5440703868865967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,1,power_law_1.2,0.38353919982910156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,1,power_law_1.2,0.40049920082092283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,1,power_law_1.01,0.6083327770233155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,1,power_law_1.2,0.4259200096130371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,1,power_law_1.01,0.6741375923156738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,1,power_law_1.2,0.4531519889831543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,1,power_law_1.01,0.7929088115692139
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,4,power_law_1.01,0.0779263973236084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,1,power_law_1.2,0.47322878837585447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,4,power_law_1.01,0.04842880070209503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,1,power_law_1.01,0.8502464294433594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,4,power_law_1.01,0.056620800495147706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,1,power_law_1.2,0.49779839515686036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,1,power_law_1.01,1.0411264419555664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,4,power_law_1.01,0.07157120108604431
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,1,power_law_1.2,0.48959999084472655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,1,power_law_1.01,1.2752320289611816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,4,power_law_1.01,0.08752639889717102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,1,power_law_1.2,0.5129663944244385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,1,power_law_1.01,1.6202943801879883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,4,power_law_1.01,0.11847039461135864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,1,power_law_1.2,0.525651216506958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,4,power_law_1.01,0.11847039461135864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,1,power_law_1.01,1.965388870239258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,1,power_law_1.2,0.5571839809417725
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,4,power_law_1.01,0.12420480251312256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,1,power_law_1.01,2.692633628845215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,4,power_law_1.01,0.1258239984512329
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,1,power_law_1.2,0.6239552021026611
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,1,power_law_1.01,3.3742145538330077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,4,power_law_1.01,0.12625279426574706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,1,power_law_1.2,0.6847936153411865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,4,power_law_1.2,0.07359359860420227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,4,power_law_1.01,0.13055360317230225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,1,power_law_1.01,4.126233673095703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,1,power_law_1.2,0.8002559661865234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,4,power_law_1.2,0.04431360065937042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,4,power_law_1.01,0.1301375985145569
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,4,power_law_1.2,0.05660799741744995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,1,power_law_1.2,0.878105640411377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,4,power_law_1.01,0.13382400274276735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,1,power_law_1.01,6.454573059082032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,4,power_law_1.2,0.07278079986572265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,1,power_law_1.2,1.0577152252197266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,4,power_law_1.01,0.1387392044067383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,4,power_law_1.2,0.08321920037269592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,4,power_law_1.01,0.14959360361099244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,1,power_law_1.2,1.2973440170288086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,1,power_law_1.01,12.616012573242188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,4,power_law_1.2,0.1170240044593811
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,4,power_law_1.01,0.14978560209274291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,1,power_law_1.2,1.645248031616211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,4,power_law_1.2,0.12091519832611083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,4,power_law_1.01,0.15492479801177977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,1,power_law_1.2,1.9920255661010742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,4,power_law_1.2,0.12151679992675782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,4,power_law_1.01,0.1755903959274292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,4,power_law_1.2,0.12501120567321777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,4,power_law_1.01,0.19219839572906494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,1,power_law_1.2,2.6971456527709963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,4,power_law_1.2,0.1254207968711853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,4,power_law_1.01,0.2378688097000122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,1,power_law_1.2,3.4053375244140627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,4,power_law_1.2,0.1323904037475586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,4,power_law_1.01,0.2581376075744629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,1,power_law_1.2,4.162700653076172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,4,power_law_1.2,0.14056960344314576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,4,power_law_1.01,0.31958398818969724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,4,power_law_1.2,0.1383296012878418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,4,power_law_1.01,0.41541118621826173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,1,power_law_1.2,6.31207046508789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,4,power_law_1.2,0.14507520198822021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,4,power_law_1.01,0.523967981338501
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,4,power_law_1.2,0.15205119848251342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,4,power_law_1.01,0.7064511775970459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,1,power_law_1.2,13.086860656738281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,4,power_law_1.2,0.15695359706878662
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,4,power_law_1.01,0.9050944328308106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,4,power_law_1.2,0.1624768018722534
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,4,power_law_1.01,1.226841640472412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,4,power_law_1.2,0.1719040036201477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,4,power_law_1.01,1.4459391593933106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,4,power_law_1.2,0.19464319944381714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,4,power_law_1.01,2.1848896026611326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,4,power_law_1.2,0.23887360095977783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,4,power_law_1.2,0.2585344076156616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,4,power_law_1.01,4.654348754882813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,4,power_law_1.2,0.32427520751953126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,4,power_law_1.2,0.42524161338806155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,4,power_law_1.2,0.5878592014312745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,4,power_law_1.2,0.718726396560669
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,4,power_law_1.2,0.955891227722168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,4,power_law_1.2,1.2821248054504395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,4,power_law_1.2,1.6804672241210938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,2,power_law_1.01,0.04457600116729736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,4,power_law_1.2,2.5611007690429686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,2,power_law_1.01,0.047443199157714847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,2,power_law_1.01,0.05443199872970581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,4,power_law_1.2,5.322828674316407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,2,power_law_1.01,0.0732479989528656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,2,power_law_1.01,0.08922240138053894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,2,power_law_1.01,0.12035200595855713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,2,power_law_1.01,0.1252671957015991
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,2,power_law_1.01,0.12670079469680787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,2,power_law_1.01,0.13059200048446656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,2,power_law_1.01,0.1318079948425293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,2,power_law_1.01,0.14001280069351196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,2,power_law_1.01,0.13878400325775148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,2,power_law_1.01,0.14450559616088868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,2,power_law_1.2,0.04539520144462585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,2,power_law_1.01,0.15146880149841307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,2,power_law_1.2,0.04499199986457825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,2,power_law_1.01,0.15927040576934814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,2,power_law_1.2,0.0546176016330719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,2,power_law_1.01,0.16784000396728516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,2,power_law_1.2,0.06464639902114869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,2,power_law_1.01,0.1719488024711609
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,2,power_law_1.2,0.07898240089416504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,2,power_law_1.01,0.19570560455322267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,2,power_law_1.2,0.11870720386505126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,2,power_law_1.2,0.11893119812011718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,2,power_law_1.01,0.20923519134521484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,2,power_law_1.2,0.12977919578552247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,2,power_law_1.01,0.2487488031387329
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,2,power_law_1.2,0.13407360315322875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,2,power_law_1.01,0.28460159301757815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,2,power_law_1.2,0.12936960458755492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,2,power_law_1.01,0.3861824035644531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,2,power_law_1.2,0.14064639806747437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,2,power_law_1.01,0.47688961029052734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,2,power_law_1.2,0.1416383981704712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,2,power_law_1.01,0.6291903972625732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,2,power_law_1.2,0.14327679872512816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,2,power_law_1.01,0.822003173828125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,1,power_law_1.01,0.04555520117282867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,2,power_law_1.2,0.1572160005569458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,1,power_law_1.01,0.050886398553848265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,2,power_law_1.01,1.109318447113037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,2,power_law_1.2,0.16847360134124756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,1,power_law_1.01,0.061536002159118655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,2,power_law_1.01,1.431283187866211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,2,power_law_1.2,0.17770240306854249
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,1,power_law_1.01,0.07852799892425537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,2,power_law_1.01,1.8635967254638672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,2,power_law_1.2,0.17155200242996216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,1,power_law_1.01,0.09430400133132935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,2,power_law_1.2,0.19244799613952637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,1,power_law_1.01,0.13444479703903198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,2,power_law_1.01,2.780486488342285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,2,power_law_1.2,0.22150399684906005
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,1,power_law_1.01,0.14263039827346802
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,2,power_law_1.01,5.253247833251953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,2,power_law_1.2,0.2665855884552002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,1,power_law_1.01,0.14672640562057496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,1,power_law_1.01,0.15471999645233153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,2,power_law_1.2,0.29402239322662355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,1,power_law_1.01,0.15593600273132324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,2,power_law_1.2,0.38782079219818116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,1,power_law_1.2,0.0430976003408432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,1,power_law_1.01,0.17170560359954834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,2,power_law_1.2,0.4670464038848877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,1,power_law_1.2,0.04840959906578064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,1,power_law_1.01,0.17785600423812867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,2,power_law_1.2,0.6153535842895508
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,1,power_law_1.2,0.059673601388931276
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,1,power_law_1.01,0.1886847972869873
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,2,power_law_1.2,0.796992015838623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,1,power_law_1.2,0.0754368007183075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,1,power_law_1.01,0.17027839422225952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,2,power_law_1.2,1.179366397857666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,1,power_law_1.2,0.08691200017929077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,1,power_law_1.01,0.1794816017150879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,2,power_law_1.2,1.379251194000244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,1,power_law_1.2,0.13278720378875733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,1,power_law_1.01,0.18830080032348634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,2,power_law_1.2,1.806662368774414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,1,power_law_1.2,0.1444607973098755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,1,power_law_1.01,0.20223360061645507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,1,power_law_1.01,0.24175360202789306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,1,power_law_1.2,0.14773759841918946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,2,power_law_1.2,3.074176025390625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,1,power_law_1.01,0.27514240741729734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,1,power_law_1.2,0.15224319696426392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,1,power_law_1.01,0.3365823984146118
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,1,power_law_1.2,0.15471359491348266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,2,power_law_1.2,6.266393661499023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,1,power_law_1.2,0.15818239450454713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,1,power_law_1.01,0.3865472078323364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,1,power_law_1.2,0.16350719928741456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,1,power_law_1.01,0.49448318481445314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,1,power_law_1.2,0.16596479415893556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,1,power_law_1.01,0.5931968212127685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,1,power_law_1.2,0.17374720573425292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,1,power_law_1.01,0.791648006439209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,1,power_law_1.2,0.18420480489730834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,1,power_law_1.01,0.9800640106201172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,1,power_law_1.2,0.196070396900177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,1,power_law_1.01,1.3644543647766114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,1,power_law_1.2,0.20528640747070312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,1,power_law_1.01,1.7545856475830077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,1,power_law_1.2,0.24253439903259277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,1,power_law_1.01,2.147609519958496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,1,power_law_1.2,0.2708224058151245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,1,power_law_1.2,0.3234560012817383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,1,power_law_1.01,3.3114944458007813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,1,power_law_1.2,0.39165439605712893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,1,power_law_1.01,6.511283111572266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,1,power_law_1.2,0.4969344139099121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,1,power_law_1.2,0.5894976139068604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,1,power_law_1.2,0.7809855937957764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,1,power_law_1.2,0.9661055564880371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,1,power_law_1.2,1.348902416229248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,1,power_law_1.2,1.7251199722290038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,1,power_law_1.2,2.1230400085449217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,1,power_law_1.2,3.316339111328125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,1,power_law_1.2,6.509439849853516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,4,power_law_1.01,0.1137984037399292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,4,power_law_1.01,0.1559872031211853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,4,power_law_1.01,0.11051520109176635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,4,power_law_1.01,0.14936959743499756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,4,power_law_1.01,0.17994879484176635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,4,power_law_1.01,0.2696703910827637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,4,power_law_1.01,0.2784575939178467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,4,power_law_1.01,0.28808319568634033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,4,power_law_1.01,0.29443199634552003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,4,power_law_1.01,0.30098559856414797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,4,power_law_1.01,0.30506880283355714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,4,power_law_1.01,0.30487680435180664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,4,power_law_1.01,0.31614079475402834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,4,power_law_1.01,0.3382591962814331
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,4,power_law_1.01,0.3583296060562134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,4,power_law_1.2,0.11216000318527222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,4,power_law_1.01,0.37059841156005857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,4,power_law_1.2,0.0834879994392395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,4,power_law_1.01,0.3726655960083008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,4,power_law_1.2,0.09251199960708618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,4,power_law_1.01,0.42223358154296875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,4,power_law_1.2,0.1342911958694458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,4,power_law_1.01,0.45274882316589354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,4,power_law_1.2,0.17155840396881103
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,4,power_law_1.01,0.5485824108123779
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,4,power_law_1.2,0.26823039054870607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,4,power_law_1.2,0.2823424100875854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,4,power_law_1.01,0.6305024147033691
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,4,power_law_1.2,0.281331205368042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,4,power_law_1.01,0.7544064044952392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,4,power_law_1.2,0.29208319187164306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,4,power_law_1.01,0.8224127769470215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,4,power_law_1.2,0.2993599891662598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,4,power_law_1.01,1.0888447761535645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,4,power_law_1.2,0.3149183988571167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,4,power_law_1.01,1.3911231994628905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,4,power_law_1.2,0.31245439052581786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,4,power_law_1.01,2.005523109436035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,4,power_law_1.2,0.3312896013259888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,4,power_law_1.01,2.502988815307617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,4,power_law_1.2,0.336409592628479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,2,power_law_1.01,0.08611199855804444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,4,power_law_1.01,2.9283199310302734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,4,power_law_1.2,0.35422720909118655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,2,power_law_1.01,0.10862079858779908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,4,power_law_1.2,0.38064639568328856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,4,power_law_1.01,4.826419067382813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,2,power_law_1.01,0.09164159893989562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,4,power_law_1.2,0.3784127950668335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,2,power_law_1.01,0.14201600551605226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,4,power_law_1.2,0.44084482192993163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,4,power_law_1.01,10.454348754882812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,2,power_law_1.01,0.17335679531097412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,4,power_law_1.2,0.4928768157958984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,2,power_law_1.01,0.25445759296417236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,4,power_law_1.2,0.5891520023345947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,2,power_law_1.01,0.287225604057312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,4,power_law_1.2,0.5743872165679932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,2,power_law_1.01,0.3012864112854004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,2,power_law_1.01,0.2952127933502197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,4,power_law_1.2,0.6888127803802491
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,2,power_law_1.01,0.3054527997970581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,4,power_law_1.2,0.8785152435302734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,2,power_law_1.2,0.08528000116348267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,2,power_law_1.01,0.3121920108795166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,2,power_law_1.2,0.07831040024757385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,4,power_law_1.2,1.1973888397216796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,2,power_law_1.01,0.3218368053436279
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,2,power_law_1.2,0.09489279985427856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,4,power_law_1.2,1.509727954864502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,2,power_law_1.01,0.3318592071533203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,2,power_law_1.2,0.1370751976966858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,4,power_law_1.2,2.1185855865478516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,2,power_law_1.01,0.34844160079956055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,2,power_law_1.2,0.16514559984207153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,4,power_law_1.2,2.5832767486572266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,2,power_law_1.01,0.3597248077392578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,2,power_law_1.2,0.2634495973587036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,4,power_law_1.2,3.3451263427734377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,2,power_law_1.01,0.37324159145355223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,2,power_law_1.2,0.27942399978637694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,2,power_law_1.01,0.3861439943313599
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,2,power_law_1.2,0.3059711933135986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,4,power_law_1.2,5.094540786743164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,2,power_law_1.01,0.42442879676818845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,2,power_law_1.2,0.30933120250701907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,2,power_law_1.01,0.45229439735412597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,2,power_law_1.2,0.30318078994750974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,4,power_law_1.2,13.332421875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,2,power_law_1.01,0.5173952102661132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,2,power_law_1.2,0.32284159660339357
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,2,power_law_1.01,0.6087488174438477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,2,power_law_1.2,0.3375808000564575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,2,power_law_1.01,0.7752639770507812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,2,power_law_1.2,0.34333438873291017
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,2,power_law_1.01,0.8416064262390137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,2,power_law_1.01,1.1240320205688477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,2,power_law_1.01,1.3902655601501466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,2,power_law_1.01,1.8757823944091796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,2,power_law_1.01,2.4267711639404297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,2,power_law_1.01,2.891872024536133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,2,power_law_1.01,4.675225448608399
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,2,power_law_1.01,9.988813018798828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,1,power_law_1.01,0.06710399985313416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,1,power_law_1.01,0.0834176003932953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,1,power_law_1.01,0.10722559690475464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,1,power_law_1.01,0.14246400594711303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,1,power_law_1.01,0.1899839997291565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,1,power_law_1.01,0.28225278854370117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,1,power_law_1.01,0.3030143976211548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,1,power_law_1.01,0.31081600189208985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,1,power_law_1.01,0.3196223974227905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,1,power_law_1.01,0.3308864116668701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,1,power_law_1.01,0.3403072118759155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,1,power_law_1.01,0.3411263942718506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,1,power_law_1.01,0.3501375913619995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,1,power_law_1.01,0.3575999975204468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,1,power_law_1.01,0.3812671899795532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,1,power_law_1.01,0.39315199851989746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,1,power_law_1.01,0.4222271919250488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,1,power_law_1.01,0.48264322280883787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,1,power_law_1.2,0.06341760158538819
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,1,power_law_1.01,0.5367104053497315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,1,power_law_1.2,0.07508479952812194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,1,power_law_1.01,0.6454592227935791
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,1,power_law_1.2,0.09906560182571411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,1,power_law_1.01,0.6860159873962403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,1,power_law_1.2,0.13509759902954102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,1,power_law_1.2,0.1666432023048401
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,1,power_law_1.01,0.8715519905090332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,1,power_law_1.2,0.2760063886642456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,1,power_law_1.01,1.1814271926879882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,4,power_law_1.01,0.13731199502944946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,1,power_law_1.2,0.29279360771179197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,1,power_law_1.01,1.5445311546325684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,4,power_law_1.01,0.168012797832489
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,1,power_law_1.2,0.3110208034515381
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,1,power_law_1.01,1.8623743057250977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,1,power_law_1.2,0.3214591979980469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,4,power_law_1.01,0.2620352029800415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,1,power_law_1.01,2.5824512481689452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,1,power_law_1.2,0.3378495931625366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,4,power_law_1.01,0.14261759519577027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,1,power_law_1.01,3.120044708251953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,1,power_law_1.2,0.3398848056793213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,4,power_law_1.01,0.21349120140075684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,1,power_law_1.01,3.8270206451416016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,1,power_law_1.2,0.3495296001434326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,4,power_law_1.01,0.29418239593505857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,1,power_law_1.2,0.3595583915710449
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,1,power_law_1.01,6.1768959045410154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,4,power_law_1.01,0.3427200078964233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,1,power_law_1.2,0.37677440643310545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,1,power_law_1.2,0.3849600076675415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,4,power_law_1.01,0.44451198577880857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,1,power_law_1.01,11.759474945068359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,1,power_law_1.2,0.4017536163330078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,4,power_law_1.01,0.46826882362365724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,1,power_law_1.2,0.42508797645568847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,4,power_law_1.01,0.48178558349609374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,1,power_law_1.2,0.49370241165161133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,4,power_law_1.01,0.5206975936889648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,1,power_law_1.2,0.5236095905303955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,4,power_law_1.01,0.5469056129455566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,1,power_law_1.2,0.619871997833252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,1,power_law_1.2,0.696665620803833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,4,power_law_1.01,0.5210944175720215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,1,power_law_1.2,0.8727871894836425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,4,power_law_1.01,0.5362368106842041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,1,power_law_1.2,1.0782079696655273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,4,power_law_1.01,0.5792511940002442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,1,power_law_1.2,1.4165311813354493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,4,power_law_1.01,0.5952383995056152
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,1,power_law_1.2,1.7353984832763671
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,4,power_law_1.01,0.6013760089874267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,1,power_law_1.2,2.430496025085449
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,4,power_law_1.01,0.6396671772003174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,1,power_law_1.2,3.1253759384155275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,4,power_law_1.01,0.6659008026123047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,1,power_law_1.2,3.8266239166259766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,4,power_law_1.01,0.7338943958282471
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,4,power_law_1.01,0.8244159698486329
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,1,power_law_1.2,6.319039916992187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,4,power_law_1.01,0.9313023567199707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,1,power_law_1.2,11.993644714355469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,4,power_law_1.01,1.0176704406738282
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,4,power_law_1.01,1.2997568130493165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,4,power_law_1.01,1.5862719535827636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,4,power_law_1.01,2.0874176025390625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,4,power_law_1.01,2.784556770324707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,4,power_law_1.01,3.3045440673828126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,4,power_law_1.01,4.747283172607422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,4,power_law_1.01,8.664281463623047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,4,power_law_1.2,0.12547199726104735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,4,power_law_1.2,0.16561280488967894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,4,power_law_1.2,0.14903039932250978
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,4,power_law_1.2,0.1355072021484375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,4,power_law_1.2,0.20432000160217284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,2,power_law_1.2,0.3490560054779053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,4,power_law_1.2,0.26801280975341796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,2,power_law_1.2,0.3726016044616699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,2,power_law_1.2,0.3652415990829468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,4,power_law_1.2,0.3103935956954956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,2,power_law_1.2,0.39166080951690674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,4,power_law_1.2,0.42057600021362307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,2,power_law_1.2,0.4313920021057129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,4,power_law_1.2,0.4437312126159668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,2,power_law_1.2,0.4588223934173584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,4,power_law_1.2,0.451910400390625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,2,power_law_1.2,0.5493567943572998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,4,power_law_1.2,0.5092671871185303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,2,power_law_1.2,0.6112063884735107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,2,power_law_1.2,0.7183040142059326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,4,power_law_1.2,0.497376012802124
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,2,power_law_1.2,0.8678208351135254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,4,power_law_1.2,0.5125376224517822
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,2,power_law_1.2,1.1154239654541016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,4,power_law_1.2,0.5580095767974853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,2,power_law_1.2,1.4562111854553224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,4,power_law_1.2,0.5776639938354492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,2,power_law_1.2,1.9211008071899414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,4,power_law_1.2,0.5698751926422119
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,2,power_law_1.2,2.702835273742676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,4,power_law_1.2,0.6059199810028076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,2,power_law_1.2,2.9385536193847654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,4,power_law_1.2,0.6536448001861572
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,2,power_law_1.01,0.08471680283546448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,4,power_law_1.2,0.7113664150238037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,2,power_law_1.2,4.753862380981445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,2,power_law_1.01,0.11215360164642334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,4,power_law_1.2,0.8215807914733887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,2,power_law_1.01,0.17136000394821166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,2,power_law_1.2,12.196736145019532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,4,power_law_1.2,0.9121024131774902
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,2,power_law_1.01,0.13508479595184325
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,4,power_law_1.2,1.1130175590515137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,2,power_law_1.01,0.22152318954467773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,4,power_law_1.2,1.142092800140381
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,2,power_law_1.01,0.3075455904006958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,4,power_law_1.2,1.3608192443847655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,2,power_law_1.01,0.3425600051879883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,2,power_law_1.01,0.42171521186828614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,4,power_law_1.2,1.74072322845459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,2,power_law_1.01,0.4609344005584717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,2,power_law_1.2,0.08693119883537292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,4,power_law_1.2,2.2659711837768555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,2,power_law_1.01,0.49944319725036623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,2,power_law_1.2,0.11724159717559815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,4,power_law_1.2,2.925497627258301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,2,power_law_1.01,0.49944319725036623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,2,power_law_1.2,0.13196799755096436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,4,power_law_1.2,3.4110721588134765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,2,power_law_1.2,0.14180480241775512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,2,power_law_1.01,0.5252416133880615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,4,power_law_1.2,6.1334785461425785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,2,power_law_1.2,0.19545600414276124
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,2,power_law_1.01,0.5416128158569335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,2,power_law_1.2,0.25914878845214845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,2,power_law_1.01,0.5473536014556885
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,4,power_law_1.2,11.671494293212891
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,2,power_law_1.2,0.3156928062438965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,2,power_law_1.01,0.5793216228485107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,2,power_law_1.2,0.434662389755249
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,2,power_law_1.01,0.6047167778015137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,2,power_law_1.01,0.611679983139038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,2,power_law_1.2,0.4449151992797852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,2,power_law_1.2,0.4694784164428711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,2,power_law_1.01,0.6626751899719239
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,2,power_law_1.2,0.4846464157104492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,2,power_law_1.01,0.6958399772644043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,2,power_law_1.2,0.5201727867126464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,2,power_law_1.01,0.8166015625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,2,power_law_1.2,0.5399424076080322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,2,power_law_1.01,0.8797439575195313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,2,power_law_1.2,0.5581439971923828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,2,power_law_1.01,1.055679988861084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,2,power_law_1.2,0.5948351860046387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,2,power_law_1.01,1.1294015884399413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,2,power_law_1.2,0.6084224224090576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,2,power_law_1.01,1.4615872383117676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,2,power_law_1.2,0.6177728176116943
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,2,power_law_1.01,1.7595712661743164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,2,power_law_1.2,0.6667200088500976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,2,power_law_1.01,2.34531192779541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,2,power_law_1.2,0.7228352069854737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,2,power_law_1.01,3.1770496368408203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,2,power_law_1.2,0.8395520210266113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,2,power_law_1.01,3.655814361572266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,2,power_law_1.2,0.9137087821960449
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,2,power_law_1.01,5.540793609619141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,2,power_law_1.2,1.0593152046203613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,2,power_law_1.2,1.1965312004089355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,2,power_law_1.01,10.62432632446289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,2,power_law_1.2,1.5285056114196778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,2,power_law_1.2,1.8368831634521485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,2,power_law_1.2,2.433657646179199
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,2,power_law_1.2,3.186841583251953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,2,power_law_1.2,4.079846572875977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,2,power_law_1.2,5.863641738891602
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,2,power_law_1.2,11.733273315429688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,1,4,power_law_1.01,0.040889599919319154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,1,4,power_law_1.01,0.042131200432777405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,1,4,power_law_1.01,0.041715198755264284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,1,4,power_law_1.01,0.04785920083522797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,1,4,power_law_1.01,0.05196160078048706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,1,4,power_law_1.01,0.05851519703865051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,1,4,power_law_1.01,0.05950719714164734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,1,4,power_law_1.01,0.05911679863929749
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,1,4,power_law_1.01,0.056460797786712646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,1,4,power_law_1.01,0.0648576021194458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,1,4,power_law_1.01,0.07958400249481201
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,1,4,power_law_1.01,0.07939199805259704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,1,4,power_law_1.01,0.08297600150108338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,1,4,power_law_1.01,0.10602240562438965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,1,4,power_law_1.2,0.04472320079803467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,1,4,power_law_1.01,0.1275264024734497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,1,4,power_law_1.2,0.046758401393890384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,1,4,power_law_1.01,0.12999039888381958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,1,4,power_law_1.2,0.04411520063877106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,1,4,power_law_1.01,0.15045759677886963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,1,4,power_law_1.2,0.04842239916324616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,1,4,power_law_1.01,0.2723072052001953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,1,4,power_law_1.2,0.04965760111808777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,1,4,power_law_1.01,0.2618688106536865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,1,4,power_law_1.2,0.0590719997882843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,1,4,power_law_1.01,0.46340479850769045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,1,4,power_law_1.2,0.058208000659942624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,1,4,power_law_1.01,0.6100224018096924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,1,4,power_law_1.2,0.06890239715576171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,1,power_law_1.01,0.0742143988609314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,1,4,power_law_1.01,1.027609634399414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,1,4,power_law_1.2,0.06235520243644714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,1,power_law_1.01,0.09388160109519958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,1,4,power_law_1.01,1.1146495819091797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,1,4,power_law_1.2,0.06480000019073487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,1,4,power_law_1.01,1.9072320938110352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,1,4,power_law_1.2,0.07750399708747864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,1,power_law_1.01,0.12460160255432129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,1,4,power_law_1.2,0.10126719474792481
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,1,4,power_law_1.01,2.5361600875854493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,1,power_law_1.01,0.14160000085830687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,1,4,power_law_1.2,0.08897280097007751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,1,4,power_law_1.01,4.154086303710938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,1,4,power_law_1.2,0.11519360542297363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,1,power_law_1.01,0.23130240440368652
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,1,4,power_law_1.01,5.189561462402343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,1,4,power_law_1.2,0.12625279426574706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,1,power_law_1.01,0.3166912078857422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,1,4,power_law_1.01,6.314118576049805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,1,4,power_law_1.2,0.1414080023765564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,1,4,power_law_1.2,0.1876863956451416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,1,power_law_1.01,0.3777472019195557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,1,4,power_law_1.01,9.65829086303711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,1,4,power_law_1.2,0.241759991645813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,1,4,power_law_1.2,0.37794559001922606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,1,power_law_1.01,0.47808637619018557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,1,4,power_law_1.01,22.070169067382814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,1,4,power_law_1.2,0.48955521583557127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,1,power_law_1.01,0.5071680068969726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,1,4,power_law_1.2,0.655244779586792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,1,power_law_1.01,0.5284736156463623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,1,4,power_law_1.2,1.1150208473205567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,1,4,power_law_1.2,1.373043155670166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,1,power_law_1.01,0.5432191848754883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,1,4,power_law_1.2,1.9485504150390625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,1,power_law_1.2,0.07160320281982421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,1,power_law_1.01,0.5665408134460449
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,1,4,power_law_1.2,2.5471744537353516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,1,power_law_1.2,0.09352319836616516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,1,4,power_law_1.2,4.02624626159668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,1,power_law_1.01,0.5788479804992676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,1,4,power_law_1.01,0.07693439722061157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,1,power_law_1.2,0.10805759429931641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,1,4,power_law_1.01,0.07366399765014649
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,1,4,power_law_1.2,5.9173633575439455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,1,power_law_1.01,0.6226687908172608
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,1,power_law_1.2,0.1469823956489563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,1,4,power_law_1.01,0.0744704008102417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,1,4,power_law_1.2,5.570636749267578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,1,power_law_1.01,0.6300479888916015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,1,4,power_law_1.01,0.0775551974773407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,1,power_law_1.2,0.21043839454650878
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,1,4,power_law_1.2,10.740000152587891
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,1,4,power_law_1.01,0.07816320061683654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,1,power_law_1.01,0.6523647785186768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,1,power_law_1.2,0.2934079885482788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,1,4,power_law_1.01,0.07856640219688416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,1,4,power_law_1.2,19.033786010742187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,1,power_law_1.01,0.684716796875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,1,4,power_law_1.01,0.07939839959144593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,1,power_law_1.2,0.3345664024353027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,1,4,power_law_1.01,0.08042880296707153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,1,power_law_1.01,0.758457612991333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,1,power_law_1.2,0.45194239616394044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,1,4,power_law_1.01,0.08287360072135926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,1,4,power_law_1.01,0.0818560004234314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,1,power_law_1.01,0.878873634338379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,1,power_law_1.2,0.48100481033325193
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,1,4,power_law_1.01,0.08573439717292786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,1,power_law_1.01,1.0394495964050292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,1,power_law_1.2,0.5047552108764648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,1,4,power_law_1.01,0.09168000221252441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,1,4,power_law_1.01,0.09290879964828491
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,1,power_law_1.01,1.0423168182373046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,1,power_law_1.2,0.551859188079834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,1,4,power_law_1.2,0.07524480223655701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,1,4,power_law_1.01,0.1007040023803711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,1,4,power_law_1.2,0.06992639899253845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,1,power_law_1.2,0.5735680103302002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,1,power_law_1.01,1.241158390045166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,1,4,power_law_1.01,0.11177599430084229
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,1,4,power_law_1.2,0.07648640275001525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,1,4,power_law_1.01,0.11237119436264038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,1,power_law_1.2,0.6055295944213868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,1,power_law_1.01,1.4201472282409668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,1,4,power_law_1.2,0.07791360020637512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,1,4,power_law_1.01,0.13203840255737304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,1,4,power_law_1.2,0.0787392020225525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,1,power_law_1.2,0.6227200031280518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,1,power_law_1.01,1.7931072235107421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,1,4,power_law_1.01,0.16090240478515624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,1,4,power_law_1.2,0.07956479787826538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,1,4,power_law_1.01,0.17095040082931517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,1,power_law_1.2,0.6802752017974854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,1,4,power_law_1.2,0.08037760257720947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,1,power_law_1.01,2.243008041381836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,1,4,power_law_1.01,0.2231679916381836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,1,4,power_law_1.2,0.07996799945831298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,1,power_law_1.2,0.6855999946594238
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,1,4,power_law_1.01,0.26657280921936033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,1,power_law_1.01,2.965990447998047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,1,4,power_law_1.2,0.08323839902877808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,1,power_law_1.2,0.6856063842773438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,1,4,power_law_1.01,0.417523193359375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,1,4,power_law_1.2,0.08365439772605895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,1,power_law_1.01,3.713510513305664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,1,4,power_law_1.01,0.5358848094940185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,1,4,power_law_1.2,0.08794879913330078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,1,power_law_1.2,0.7761087894439698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,1,4,power_law_1.2,0.08815360069274902
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,1,4,power_law_1.01,0.6438079833984375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,1,power_law_1.2,0.8994048118591309
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,1,power_law_1.01,4.4385215759277346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,1,4,power_law_1.2,0.09430400133132935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,1,4,power_law_1.01,1.084768009185791
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,1,4,power_law_1.2,0.10147199630737305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,1,power_law_1.2,1.033350372314453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,1,4,power_law_1.01,1.486361598968506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,1,power_law_1.01,6.968204498291016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,1,4,power_law_1.2,0.116428804397583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,1,4,power_law_1.01,2.0104448318481447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,1,power_law_1.2,1.0704192161560058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,1,4,power_law_1.2,0.1198848009109497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,1,4,power_law_1.01,3.019296073913574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,1,4,power_law_1.2,0.1317952036857605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,1,power_law_1.2,1.2829952239990234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,1,power_law_1.01,13.113420104980468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,1,4,power_law_1.2,0.16799999475479127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,1,4,power_law_1.01,4.308095932006836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,1,power_law_1.2,1.4912768363952638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,1,4,power_law_1.2,0.19771519899368287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,1,4,power_law_1.01,10.218624114990234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,1,4,power_law_1.2,0.25730559825897215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,1,power_law_1.2,1.8587072372436524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,1,4,power_law_1.2,0.2851583957672119
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,1,power_law_1.2,2.587366485595703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,1,4,power_law_1.2,0.4195072174072266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,1,4,power_law_1.2,0.5030655860900879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,1,power_law_1.2,3.3414398193359376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,1,4,power_law_1.2,0.875603199005127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,2,2,power_law_1.01,0.03162240087985992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,1,power_law_1.2,3.9380352020263674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,1,4,power_law_1.2,1.0941184043884278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,2,2,power_law_1.2,0.022457599639892578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,2,2,power_law_1.01,0.03489919900894165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,1,4,power_law_1.2,1.6399103164672852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,2,2,power_law_1.2,0.0255295991897583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,1,power_law_1.2,4.742886352539062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,2,2,power_law_1.01,0.04084480106830597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,1,4,power_law_1.2,2.1877504348754884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,2,2,power_law_1.2,0.024505600333213806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,2,2,power_law_1.01,0.04983679950237274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,1,4,power_law_1.2,2.843532752990723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,2,2,power_law_1.2,0.02963840067386627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,1,power_law_1.2,7.112825775146485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,2,2,power_law_1.01,0.04636160135269165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,1,4,power_law_1.2,5.145676803588867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,2,2,power_law_1.2,0.03208320140838623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,2,2,power_law_1.01,0.05620480179786682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,2,2,power_law_1.2,0.04129279851913452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,2,2,power_law_1.01,0.05681279897689819
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,1,power_law_1.2,13.762693786621094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,1,4,power_law_1.2,10.46864013671875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,2,2,power_law_1.2,0.03596799969673157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,2,2,power_law_1.01,0.060089600086212155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,2,2,power_law_1.2,0.046214398741722104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,2,2,power_law_1.2,0.03720960021018982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,2,2,power_law_1.2,0.03864319920539856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,2,2,power_law_1.2,0.049081599712371825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,2,2,power_law_1.2,0.05317760109901428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,2,2,power_law_1.2,0.05358719825744629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,2,2,power_law_1.2,0.058508801460266116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,2,2,power_law_1.01,0.056454402208328244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,2,2,power_law_1.2,0.055801600217819214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,2,2,power_law_1.2,0.07242879867553711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,2,2,power_law_1.2,0.06111999750137329
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,2,2,power_law_1.2,0.08492159843444824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,2,2,power_law_1.2,0.06767359972000123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,2,2,power_law_1.2,0.09144960045814514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,2,2,power_law_1.2,0.1205631971359253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,2,2,power_law_1.2,0.15371520519256593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,2,2,power_law_1.2,0.21252479553222656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,2,2,power_law_1.2,0.27272961139678953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,2,2,power_law_1.2,0.3943039894104004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,2,2,power_law_1.2,0.5154304027557373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,2,2,power_law_1.2,0.7630271911621094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,2,2,power_law_1.2,1.0005120277404784
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,2,2,power_law_1.2,1.4855551719665527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,2,2,power_law_1.2,1.9727680206298828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,2,2,power_law_1.2,2.481612777709961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,2,2,power_law_1.2,3.89502067565918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,2,2,power_law_1.2,7.804230499267578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,4,1,power_law_1.01,0.02041600048542023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,4,1,power_law_1.01,0.02348800003528595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,4,1,power_law_1.01,0.023494400084018707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,4,1,power_law_1.01,0.026150399446487428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,4,1,power_law_1.01,0.0310591995716095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,4,1,power_law_1.01,0.0355648010969162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,4,1,power_law_1.01,0.033036801218986514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,4,1,power_law_1.01,0.037196800112724304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,4,1,power_law_1.01,0.035980799794197084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,4,1,power_law_1.01,0.03597440123558045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,4,1,power_law_1.01,0.041094401478767396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,4,1,power_law_1.01,0.05331839919090271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,4,1,power_law_1.01,0.053939199447631835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,4,1,power_law_1.01,0.060147202014923094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,4,1,power_law_1.01,0.06956160068511963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,4,1,power_law_1.01,0.0716159999370575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,4,1,power_law_1.01,0.08963199853897094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,4,1,power_law_1.01,0.11584639549255371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,4,1,power_law_1.01,0.1473855972290039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,4,1,power_law_1.01,0.2088383913040161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,4,1,power_law_1.01,0.26248319149017335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,4,1,power_law_1.01,0.38227200508117676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,4,1,power_law_1.01,0.5022975921630859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,4,1,power_law_1.01,0.7424575805664062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,4,1,power_law_1.01,0.9796992301940918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,4,1,power_law_1.01,1.4652735710144043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,4,1,power_law_1.01,1.9424448013305664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,4,1,power_law_1.01,2.410425567626953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,4,1,power_law_1.01,3.828255844116211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,4,1,power_law_1.01,7.660237121582031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,4,1,power_law_1.2,0.02041600048542023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,4,1,power_law_1.2,0.022873599827289582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,4,1,power_law_1.2,0.02122880071401596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,4,1,power_law_1.2,0.02656640112400055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,4,1,power_law_1.2,0.030777600407600404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,4,1,power_law_1.2,0.03516159951686859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,4,1,power_law_1.2,0.03345920145511627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,4,1,power_law_1.2,0.036800000071525577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,4,1,power_law_1.2,0.035980799794197084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,4,1,power_law_1.2,0.03635840117931366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,4,1,power_law_1.2,0.04048640131950378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,4,1,power_law_1.2,0.05235199928283692
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,4,1,power_law_1.2,0.05400959849357605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,4,1,power_law_1.2,0.05687040090560913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,4,1,power_law_1.2,0.0707584023475647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,4,1,power_law_1.2,0.07240960001945496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,4,1,power_law_1.2,0.08718079924583436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,4,1,power_law_1.2,0.11912959814071655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,4,1,power_law_1.2,0.14739840030670165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,4,1,power_law_1.2,0.20882558822631836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,4,1,power_law_1.2,0.26207358837127687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,4,1,power_law_1.2,0.3825023889541626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,4,1,power_law_1.2,0.5051904201507569
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,4,1,power_law_1.2,0.7379903793334961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,4,1,power_law_1.2,0.9840576171875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,4,1,power_law_1.2,1.4640447616577148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,4,1,power_law_1.2,1.9428800582885741
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,4,1,power_law_1.2,2.402604866027832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,4,1,power_law_1.2,3.8651264190673826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,4,1,power_law_1.2,7.665190124511719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,4,1,power_law_1.01,0.045516800880432126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,4,1,power_law_1.01,0.050732797384262084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,4,1,power_law_1.01,0.05400959849357605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,4,1,power_law_1.01,0.07285119891166687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,4,1,power_law_1.01,0.07243520021438599
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,4,1,power_law_1.01,0.07363839745521546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,4,1,power_law_1.01,0.07365760207176208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,4,1,power_law_1.01,0.07407360076904297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,4,1,power_law_1.01,0.07612159848213196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,4,1,power_law_1.01,0.07734400033950806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,4,1,power_law_1.01,0.0794048011302948
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,4,1,power_law_1.01,0.08300799727439881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,4,1,power_law_1.01,0.08492799997329711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,4,1,power_law_1.01,0.0877888023853302
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,4,1,power_law_1.01,0.09783040285110474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,4,1,power_law_1.01,0.1011072039604187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,4,1,power_law_1.01,0.11292799711227416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,4,1,power_law_1.01,0.1338752031326294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,4,1,power_law_1.01,0.14534399509429932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,4,1,power_law_1.01,0.1805567979812622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,4,1,power_law_1.01,0.2104640007019043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,4,1,power_law_1.01,0.27232000827789304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,4,1,power_law_1.01,0.3321151971817017
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,4,1,power_law_1.01,0.4597184181213379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,4,1,power_law_1.01,0.5829951763153076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,4,1,power_law_1.01,0.8310144424438477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,4,1,power_law_1.01,1.085580825805664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,4,1,power_law_1.01,1.3428159713745118
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,4,1,power_law_1.01,2.1427711486816405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,4,1,power_law_1.01,4.463961410522461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,4,1,power_law_1.2,0.04826239943504333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,4,1,power_law_1.2,0.0490880012512207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,4,1,power_law_1.2,0.050316798686981204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,4,1,power_law_1.2,0.07203199863433837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,4,1,power_law_1.2,0.0720192015171051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,4,1,power_law_1.2,0.07406719923019409
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,4,1,power_law_1.2,0.07427840232849121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,4,1,power_law_1.2,0.07489280104637146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,4,1,power_law_1.2,0.07706239819526672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,4,1,power_law_1.2,0.07898240089416504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,4,1,power_law_1.2,0.07939839959144593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,4,1,power_law_1.2,0.08410239815711976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,4,1,power_law_1.2,0.08469120264053345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,4,1,power_law_1.2,0.08636800050735474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,4,1,power_law_1.2,0.09822720289230347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,4,1,power_law_1.2,0.09927039742469787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,4,1,power_law_1.2,0.11395200490951538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,2,2,power_law_1.01,0.05927039980888367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,4,1,power_law_1.2,0.13182719945907592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,2,2,power_law_1.01,0.05928959846496582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,4,1,power_law_1.2,0.14391039609909057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,2,2,power_law_1.01,0.06336640119552613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,4,1,power_law_1.2,0.17791359424591063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,2,2,power_law_1.01,0.07994239926338195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,4,1,power_law_1.2,0.21006081104278565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,2,2,power_law_1.01,0.0828224003314972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,4,1,power_law_1.2,0.2694591999053955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,2,2,power_law_1.01,0.08712319731712341
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,4,1,power_law_1.2,0.3312959909439087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,2,2,power_law_1.01,0.09552639722824097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,4,1,power_law_1.2,0.46134400367736816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,2,2,power_law_1.01,0.059724801778793336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,2,2,power_law_1.01,0.11067520380020142
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,4,1,power_law_1.2,0.5829951763153076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,2,2,power_law_1.01,0.058713597059249875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,2,2,power_law_1.01,0.12501120567321777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,4,1,power_law_1.2,0.8363264083862305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,2,2,power_law_1.01,0.07282559871673584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,2,2,power_law_1.2,0.07464320063591004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,2,2,power_law_1.01,0.17887359857559204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,4,1,power_law_1.2,1.0843520164489746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,2,2,power_law_1.01,0.07366399765014649
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,2,2,power_law_1.2,0.07445120215415954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,2,2,power_law_1.01,0.20672640800476075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,2,2,power_law_1.01,0.07468159794807434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,2,2,power_law_1.2,0.07587199807167053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,4,1,power_law_1.2,1.3481151580810546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,2,2,power_law_1.01,0.295411205291748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,2,2,power_law_1.01,0.07550079822540283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,2,2,power_law_1.2,0.07648640275001525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,4,1,power_law_1.2,2.166912078857422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,2,2,power_law_1.01,0.35971200466156006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,2,2,power_law_1.01,0.0769216001033783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,2,2,power_law_1.2,0.077292799949646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,4,1,power_law_1.2,4.429119873046875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,2,2,power_law_1.01,0.512883186340332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,2,2,power_law_1.01,0.07816320061683654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,2,2,power_law_1.2,0.08184959888458251
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,2,2,power_law_1.01,0.7453440189361572
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,2,2,power_law_1.01,0.07978879809379577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,2,2,power_law_1.2,0.08528000116348267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,2,2,power_law_1.01,0.08327040076255798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,2,2,power_law_1.2,0.08486400246620178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,2,2,power_law_1.01,1.0961600303649903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,2,2,power_law_1.01,0.08635519742965699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,2,2,power_law_1.2,0.08793600201606751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,2,2,power_law_1.01,1.5207167625427247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,1,4,power_law_1.01,0.013036799430847169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,2,2,power_law_1.2,0.08856319785118102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,2,2,power_law_1.01,0.08758400082588196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,2,2,power_law_1.01,2.3501632690429686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,1,4,power_law_1.01,0.01372160017490387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,2,2,power_law_1.2,0.0893887996673584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,2,2,power_law_1.01,0.0914687991142273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,2,2,power_law_1.01,3.3155776977539064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,1,4,power_law_1.01,0.014131200313568116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,2,2,power_law_1.2,0.10042239427566528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,2,2,power_law_1.01,0.10192639827728271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,2,2,power_law_1.01,3.930188751220703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,1,4,power_law_1.01,0.012831999361515046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,2,2,power_law_1.2,0.1076159954071045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,2,2,power_law_1.01,0.10315519571304321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,1,4,power_law_1.01,0.015289600193500518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,2,2,power_law_1.2,0.12051199674606324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,2,2,power_law_1.01,0.11768959760665894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,2,2,power_law_1.01,5.701100921630859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,1,4,power_law_1.01,0.019801600277423857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,2,2,power_law_1.2,0.13852159976959227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,2,2,power_law_1.01,0.13898240327835082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,1,4,power_law_1.01,0.01693439930677414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,2,2,power_law_1.01,11.703782653808593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,2,2,power_law_1.2,0.17047040462493895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,2,2,power_law_1.01,0.14942079782485962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,1,4,power_law_1.01,0.019392000138759614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,2,2,power_law_1.2,0.19505280256271362
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,2,2,power_law_1.01,0.20799360275268555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,1,4,power_law_1.01,0.01714559942483902
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,2,2,power_law_1.2,0.2396928071975708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,2,2,power_law_1.01,0.22316160202026367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,1,4,power_law_1.01,0.01733759939670563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,2,2,power_law_1.2,0.29684479236602784
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,2,2,power_law_1.01,0.3108031988143921
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,1,4,power_law_1.01,0.019808000326156615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,2,2,power_law_1.2,0.4530943870544434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,2,2,power_law_1.01,0.33702399730682375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,1,4,power_law_1.01,0.017951999604701997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,2,2,power_law_1.2,0.4887360095977783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,2,2,power_law_1.01,0.5932223796844482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,1,4,power_law_1.01,0.01775359958410263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,2,2,power_law_1.2,0.8043392181396485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,2,2,power_law_1.01,0.7372032165527344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,1,4,power_law_1.01,0.019801600277423857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,2,2,power_law_1.2,1.2317631721496582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,2,2,power_law_1.01,0.9555135726928711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,1,4,power_law_1.01,0.02144639939069748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,2,2,power_law_1.2,1.4512895584106444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,2,2,power_law_1.01,1.283795166015625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,1,4,power_law_1.01,0.02327679991722107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,2,2,power_law_1.2,1.6976640701293946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,2,2,power_law_1.01,1.8029823303222656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,1,4,power_law_1.01,0.02717440128326416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,1,4,power_law_1.01,0.03311359882354736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,2,2,power_law_1.2,2.642207908630371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,2,2,power_law_1.01,2.9963520050048826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,1,4,power_law_1.01,0.03925760090351105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,2,2,power_law_1.2,6.714854431152344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,2,2,power_law_1.01,6.176076889038086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,1,4,power_law_1.01,0.05317760109901428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,1,4,power_law_1.01,0.06506239771842956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,1,4,power_law_1.01,0.08963840007781983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,1,4,power_law_1.01,0.11420799493789673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,1,4,power_law_1.2,0.05557760000228882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,1,4,power_law_1.01,0.1674623966217041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,1,4,power_law_1.2,0.06500480175018311
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,1,4,power_law_1.01,0.21907200813293456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,1,4,power_law_1.2,0.06889600157737732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,1,4,power_law_1.01,0.32023038864135744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,1,4,power_law_1.2,0.06971520185470581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,1,4,power_law_1.2,0.08769279718399048
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,1,4,power_law_1.01,0.42017278671264646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,1,4,power_law_1.2,0.12828160524368287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,1,4,power_law_1.01,0.5195072174072266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,1,4,power_law_1.01,0.07831680178642272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,1,4,power_law_1.2,0.0937279999256134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,1,4,power_law_1.2,0.10739200115203858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,1,4,power_law_1.01,0.8215807914733887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,1,4,power_law_1.01,0.07831040024757385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,1,4,power_law_1.2,0.10029439926147461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,1,4,power_law_1.2,0.14343680143356324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,1,4,power_law_1.01,1.6211135864257813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,1,4,power_law_1.01,0.0899839997291565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,1,4,power_law_1.2,0.09966719746589661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,1,4,power_law_1.2,0.10535680055618286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,1,4,power_law_1.01,0.10453120470046998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,1,4,power_law_1.2,0.1060096025466919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,1,4,power_law_1.2,0.11886080503463745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,1,4,power_law_1.01,0.10576000213623046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,1,4,power_law_1.2,0.1051967978477478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,1,4,power_law_1.2,0.14631680250167847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,1,4,power_law_1.01,0.10821759700775146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,1,4,power_law_1.2,0.10804480314254761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,1,4,power_law_1.2,0.14547840356826783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,1,4,power_law_1.01,0.10699520111083985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,1,4,power_law_1.2,0.10704640150070191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,1,4,power_law_1.2,0.17581440210342408
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,1,4,power_law_1.01,0.10902400016784668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,1,4,power_law_1.2,0.10826879739761353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,1,4,power_law_1.2,0.20568959712982177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,1,4,power_law_1.01,0.1098688006401062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,1,4,power_law_1.2,0.10888320207595825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,1,4,power_law_1.2,0.24379520416259765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,2,2,power_law_1.01,0.0255295991897583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,1,4,power_law_1.01,0.11150720119476318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,1,4,power_law_1.2,0.10970239639282227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,1,4,power_law_1.2,0.27696640491485597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,2,2,power_law_1.01,0.025740799307823182
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,1,4,power_law_1.01,0.11477760076522828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,1,4,power_law_1.2,0.11727360486984253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,2,2,power_law_1.01,0.026348799467086792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,1,4,power_law_1.2,0.32817280292510986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,1,4,power_law_1.01,0.11989760398864746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,1,4,power_law_1.2,0.12197760343551636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,2,2,power_law_1.01,0.02656640112400055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,1,4,power_law_1.2,0.5104320049285889
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,1,4,power_law_1.01,0.12133760452270508
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,1,4,power_law_1.2,0.12422399520874024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,2,2,power_law_1.01,0.03269760012626648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,1,4,power_law_1.2,0.7092927932739258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,1,4,power_law_1.01,0.13403520584106446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,1,4,power_law_1.2,0.13653119802474975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,2,2,power_law_1.01,0.04785279929637909
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,1,4,power_law_1.2,1.0152576446533204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,1,4,power_law_1.01,0.14794880151748657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,1,4,power_law_1.2,0.15599360466003417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,2,2,power_law_1.01,0.04149760007858276
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,1,4,power_law_1.2,1.3882047653198242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,1,4,power_law_1.01,0.16760319471359253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,1,4,power_law_1.2,0.15926400423049927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,2,2,power_law_1.01,0.04989440143108368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,1,4,power_law_1.2,1.8156288146972657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,1,4,power_law_1.01,0.16598399877548217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,1,4,power_law_1.2,0.1674623966217041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,2,2,power_law_1.01,0.04366720020771027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,1,4,power_law_1.2,2.2233856201171873
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,1,4,power_law_1.01,0.2216576099395752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,1,4,power_law_1.2,0.20266880989074706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,2,2,power_law_1.01,0.04355199933052063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,1,4,power_law_1.01,0.248524808883667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,1,4,power_law_1.2,4.029516983032226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,1,4,power_law_1.2,0.2725248098373413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,2,2,power_law_1.01,0.05235199928283692
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,1,4,power_law_1.01,0.30626559257507324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,1,4,power_law_1.2,0.3365952014923096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,2,2,power_law_1.01,0.06423680186271667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,1,4,power_law_1.2,5.884179306030274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,1,4,power_law_1.01,0.38366720676422117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,1,4,power_law_1.2,0.4177152156829834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,2,2,power_law_1.01,0.06506239771842956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,1,4,power_law_1.2,8.861369323730468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,1,4,power_law_1.01,0.5878528118133545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,1,4,power_law_1.2,0.6348095893859863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,2,2,power_law_1.01,0.08328959941864014
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,1,4,power_law_1.01,0.6458303928375244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,2,2,power_law_1.01,0.09535359740257263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,1,4,power_law_1.2,0.7900352001190185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,1,4,power_law_1.2,10.820275115966798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,1,4,power_law_1.01,1.1318143844604491
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,2,2,power_law_1.01,0.10683519840240478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,1,4,power_law_1.2,1.3751680374145507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,1,4,power_law_1.2,13.802764892578125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,2,2,power_law_1.01,0.12691199779510498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,1,4,power_law_1.01,1.4846847534179688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,1,4,power_law_1.2,1.6784576416015624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,2,2,power_law_1.01,0.17932800054550171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,1,4,power_law_1.01,2.7501312255859376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,1,4,power_law_1.2,2.1101823806762696
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,1,4,power_law_1.2,21.844671630859374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,2,2,power_law_1.01,0.22766079902648925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,1,4,power_law_1.01,2.615167999267578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,1,4,power_law_1.2,3.737721633911133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,2,2,power_law_1.01,0.32597761154174804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,1,4,power_law_1.01,5.117427062988281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,1,4,power_law_1.2,4.751488113403321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,2,2,power_law_1.01,0.4228479862213135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,2,2,power_law_1.01,0.6227200031280518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,1,4,power_law_1.01,6.5637054443359375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,1,4,power_law_1.2,47.042425537109374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,1,4,power_law_1.2,6.2977344512939455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,2,2,power_law_1.01,0.8178879737854003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,1,4,power_law_1.01,14.269932556152344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,2,2,power_law_1.01,1.2150079727172851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,1,4,power_law_1.2,13.887213134765625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,2,2,power_law_1.01,1.60949764251709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,2,2,power_law_1.01,2.3956159591674804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,2,2,power_law_1.01,3.1907136917114256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,2,2,power_law_1.01,3.998438262939453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,2,2,power_law_1.01,6.36808967590332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,2,2,power_law_1.01,12.653638458251953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,2,2,power_law_1.2,0.045132800936698914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,2,2,power_law_1.01,0.0717631995677948
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,2,2,power_law_1.2,0.06872959733009339
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,2,2,power_law_1.2,0.04472959935665131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,2,2,power_law_1.01,0.07217280268669128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,2,2,power_law_1.2,0.07078400254249573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,2,2,power_law_1.2,0.051072001457214355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,2,2,power_law_1.01,0.07585279941558838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,2,2,power_law_1.2,0.07690879702568054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,2,2,power_law_1.2,0.0455487996339798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,2,2,power_law_1.01,0.10043519735336304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,2,2,power_law_1.2,0.10090240240097045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,2,2,power_law_1.2,0.05415679812431336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,2,2,power_law_1.01,0.10248960256576538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,2,2,power_law_1.2,0.10232959985733033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,2,2,power_law_1.2,0.06848000288009644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,2,2,power_law_1.01,0.1074112057685852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,4,1,power_law_1.01,0.022867199778556824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,2,2,power_law_1.2,0.1051967978477478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,2,2,power_law_1.2,0.06335999965667724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,2,2,power_law_1.01,0.10432640314102173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,4,1,power_law_1.01,0.022867199778556824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,2,2,power_law_1.2,0.10499199628829955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,2,2,power_law_1.2,0.0717631995677948
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,2,2,power_law_1.01,0.10576640367507935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,4,1,power_law_1.01,0.023686400055885314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,2,2,power_law_1.2,0.1023360013961792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,2,2,power_law_1.2,0.06767359972000123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,2,2,power_law_1.01,0.10494719743728638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,4,1,power_law_1.01,0.023897600173950196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,2,2,power_law_1.2,0.10456960201263428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,2,2,power_law_1.2,0.06561279892921448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,2,2,power_law_1.01,0.10454399585723877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,4,1,power_law_1.01,0.03720319867134094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,2,2,power_law_1.2,0.10640640258789062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,2,2,power_law_1.2,0.07708160281181335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,2,2,power_law_1.01,0.10658559799194336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,4,1,power_law_1.01,0.04663040041923523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,2,2,power_law_1.2,0.10888320207595825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,2,2,power_law_1.2,0.09756159782409668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,2,2,power_law_1.01,0.1098688006401062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,4,1,power_law_1.01,0.043756800889968875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,2,2,power_law_1.2,0.11523200273513794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,2,2,power_law_1.2,0.10227199792861938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,2,2,power_law_1.01,0.11395839452743531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,4,1,power_law_1.01,0.04847359955310822
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,2,2,power_law_1.2,0.11214720010757447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,2,2,power_law_1.2,0.11804159879684448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,2,2,power_law_1.01,0.12172800302505493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,4,1,power_law_1.01,0.045798400044441225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,2,2,power_law_1.2,0.12156800031661988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,2,2,power_law_1.2,0.14997119903564454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,2,2,power_law_1.01,0.1336192011833191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,4,1,power_law_1.01,0.04622080028057098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,2,2,power_law_1.2,0.13550080060958863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,2,2,power_law_1.2,0.18030719757080077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,2,2,power_law_1.01,0.14507520198822021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,4,1,power_law_1.01,0.05072000026702881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,2,2,power_law_1.2,0.1408128023147583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,2,2,power_law_1.2,0.21427199840545655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,2,2,power_law_1.01,0.14855680465698243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,4,1,power_law_1.01,0.06444159746170045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,2,2,power_law_1.2,0.15270400047302246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,2,2,power_law_1.2,0.30728960037231445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,2,2,power_law_1.01,0.17949440479278564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,4,1,power_law_1.01,0.06526079773902893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,2,2,power_law_1.2,0.18097920417785646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,2,2,power_law_1.01,0.20979199409484864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,2,2,power_law_1.2,0.380185604095459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,4,1,power_law_1.01,0.08061439990997314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,2,2,power_law_1.2,0.22521600723266602
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,2,2,power_law_1.01,0.25321600437164304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,4,1,power_law_1.01,0.09516159892082214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,2,2,power_law_1.2,0.6050496101379395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,4,1,power_law_1.01,0.10621440410614014
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,2,2,power_law_1.2,0.28010880947113037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,2,2,power_law_1.01,0.33431038856506345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,2,2,power_law_1.2,0.7371520042419434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,4,1,power_law_1.01,0.12403199672698975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,2,2,power_law_1.01,0.4294911861419678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,2,2,power_law_1.2,0.3218816041946411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,2,2,power_law_1.2,1.0957504272460938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,4,1,power_law_1.01,0.17768319845199584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,2,2,power_law_1.01,0.587449598312378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,2,2,power_law_1.2,0.44659199714660647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,2,2,power_law_1.2,1.4785280227661133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,4,1,power_law_1.01,0.22417280673980713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,2,2,power_law_1.2,0.6018367767333984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,2,2,power_law_1.01,0.713811206817627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,2,2,power_law_1.2,2.236460876464844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,4,1,power_law_1.01,0.3241215944290161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,2,2,power_law_1.01,1.1084287643432618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,2,2,power_law_1.2,0.8467647552490234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,2,2,power_law_1.2,2.8295616149902343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,4,1,power_law_1.01,0.4156799793243408
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,2,2,power_law_1.2,0.8699263572692871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,2,2,power_law_1.01,1.5305343627929688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,2,2,power_law_1.2,4.4194496154785154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,4,1,power_law_1.01,0.6165823936462402
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,2,2,power_law_1.2,1.4679295539855957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,2,2,power_law_1.01,2.11975040435791
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,2,2,power_law_1.2,5.879264068603516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,4,1,power_law_1.01,0.8133888244628906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,2,2,power_law_1.2,1.727187156677246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,2,2,power_law_1.01,2.2037248611450195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,4,1,power_law_1.01,1.2121472358703613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,2,2,power_law_1.2,7.411174774169922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,2,2,power_law_1.2,2.3018688201904296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,2,2,power_law_1.01,4.517971038818359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,4,1,power_law_1.01,1.60064640045166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,2,2,power_law_1.2,11.285785675048828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,2,2,power_law_1.2,4.442240142822266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,4,1,power_law_1.01,2.3604352951049803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,2,2,power_law_1.01,9.780921936035156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,4,1,power_law_1.01,3.1796543121337892
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,2,2,power_law_1.2,9.772716522216797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,2,2,power_law_1.2,22.457626342773438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,4,1,power_law_1.01,3.933049774169922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,4,1,power_law_1.01,6.289113616943359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,4,1,power_law_1.01,12.545094299316407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,4,1,power_law_1.2,0.026099199056625368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,4,1,power_law_1.2,0.025900799036026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,4,1,power_law_1.2,0.033267199993133545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,4,1,power_law_1.2,0.04023039937019348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,4,1,power_law_1.01,0.05196160078048706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,4,1,power_law_1.2,0.04514560103416443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,4,1,power_law_1.2,0.05414400100708008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,4,1,power_law_1.2,0.04924800097942352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,4,1,power_law_1.01,0.06259199976921082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,4,1,power_law_1.2,0.06335999965667724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,4,1,power_law_1.2,0.0488319993019104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,4,1,power_law_1.01,0.06832000017166137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,4,1,power_law_1.2,0.06684160232543945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,4,1,power_law_1.2,0.05109120011329651
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,4,1,power_law_1.01,0.09660159945487976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,4,1,power_law_1.2,0.09716479778289795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,4,1,power_law_1.2,0.05085440278053284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,4,1,power_law_1.01,0.09699199795722961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,4,1,power_law_1.2,0.09920639991760254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,4,1,power_law_1.2,0.05252479910850525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,4,1,power_law_1.01,0.10028159618377686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,4,1,power_law_1.2,0.10083839893341065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,4,1,power_law_1.2,0.05294079780578613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,4,1,power_law_1.01,0.09660159945487976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,1,4,power_law_1.01,0.051948797702789304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,4,1,power_law_1.2,0.10000640153884888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,4,1,power_law_1.2,0.06890239715576171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,4,1,power_law_1.01,0.10273920297622681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,1,4,power_law_1.01,0.082259202003479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,4,1,power_law_1.2,0.10042879581451417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,4,1,power_law_1.2,0.06931840181350708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,4,1,power_law_1.01,0.10130560398101807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,4,1,power_law_1.2,0.10126080513000488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,1,4,power_law_1.01,0.06833919882774353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,4,1,power_law_1.2,0.08139520287513732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,4,1,power_law_1.01,0.10067839622497558
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,4,1,power_law_1.2,0.10309120416641235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,4,1,power_law_1.2,0.09633920192718506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,1,4,power_law_1.01,0.09843840003013611
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,4,1,power_law_1.01,0.10396800041198731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,4,1,power_law_1.2,0.10453120470046998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,4,1,power_law_1.2,0.10966399908065796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,4,1,power_law_1.01,0.11011199951171875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,1,4,power_law_1.01,0.13346560001373292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,4,1,power_law_1.2,0.10822399854660034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,4,1,power_law_1.2,0.12992000579833984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,4,1,power_law_1.01,0.11318399906158447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,1,4,power_law_1.01,0.15926400423049927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,4,1,power_law_1.2,0.11169279813766479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,4,1,power_law_1.2,0.18234239816665648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,4,1,power_law_1.01,0.11441279649734497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,4,1,power_law_1.2,0.11230720281600952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,4,1,power_law_1.2,0.22967679500579835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,1,4,power_law_1.01,0.1928447961807251
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,4,1,power_law_1.01,0.12997759580612184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,4,1,power_law_1.2,0.12685439586639405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,4,1,power_law_1.2,0.3304192066192627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,4,1,power_law_1.01,0.12997759580612184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,1,4,power_law_1.01,0.20206079483032227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,4,1,power_law_1.2,0.13074560165405275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,4,1,power_law_1.2,0.4305727958679199
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,4,1,power_law_1.01,0.14246400594711303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,1,4,power_law_1.01,0.2065664052963257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,4,1,power_law_1.2,0.6296512126922608
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,4,1,power_law_1.2,0.14385279417037963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,4,1,power_law_1.01,0.1654144048690796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,1,4,power_law_1.01,0.22972800731658935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,4,1,power_law_1.2,0.16677759885787963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,4,1,power_law_1.2,0.8174400329589844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,4,1,power_law_1.01,0.1938815951347351
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,4,1,power_law_1.2,0.19279359579086303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,4,1,power_law_1.2,1.218233585357666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,1,4,power_law_1.01,0.2460927963256836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,4,1,power_law_1.01,0.2366719961166382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,4,1,power_law_1.2,0.23763840198516845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,4,1,power_law_1.2,1.6128704071044921
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,4,1,power_law_1.01,0.27927680015563966
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,1,4,power_law_1.01,0.27762560844421386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,4,1,power_law_1.2,0.2802432060241699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,4,1,power_law_1.2,2.3845823287963865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,4,1,power_law_1.01,0.371014404296875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,1,4,power_law_1.01,0.30261759757995604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,4,1,power_law_1.2,0.36604158878326415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,4,1,power_law_1.2,3.1574848175048826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,4,1,power_law_1.01,0.4453695774078369
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,1,4,power_law_1.01,0.3470655918121338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,4,1,power_law_1.2,0.44367361068725586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,4,1,power_law_1.01,0.6141312122344971
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,4,1,power_law_1.2,3.9285503387451173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,4,1,power_law_1.2,0.6107903957366944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,1,4,power_law_1.01,0.2954432010650635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,4,1,power_law_1.01,0.7879936218261718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,4,1,power_law_1.2,6.293171310424805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,4,1,power_law_1.2,0.7805759906768799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,1,4,power_law_1.01,0.3218688011169434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,4,1,power_law_1.01,1.1310400009155273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,4,1,power_law_1.2,1.1227968215942383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,4,1,power_law_1.2,12.54879379272461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,4,1,power_law_1.01,1.474073600769043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,1,4,power_law_1.01,0.37348480224609376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,4,1,power_law_1.2,1.4818047523498534
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,4,1,power_law_1.01,1.8705663681030273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,1,4,power_law_1.01,0.34133760929107665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,4,1,power_law_1.2,1.839379119873047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,4,1,power_law_1.01,2.948428726196289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,1,4,power_law_1.01,0.4066624164581299
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,4,1,power_law_1.2,2.9631296157836915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,4,1,power_law_1.01,6.189184188842773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,1,4,power_law_1.01,0.5600512027740479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,4,1,power_law_1.2,6.2428031921386715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,1,4,power_law_1.01,0.6753727912902832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,1,4,power_law_1.01,0.9205632209777832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,1,4,power_law_1.01,1.1588288307189942
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,1,4,power_law_1.01,1.7448192596435548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,1,4,power_law_1.01,2.18656005859375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,1,4,power_law_1.01,3.1407424926757814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,1,4,power_law_1.2,0.052108800411224364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,1,4,power_law_1.01,0.10109440088272095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,1,4,power_law_1.2,0.0844543993473053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,1,4,power_law_1.01,4.13238410949707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,1,4,power_law_1.2,0.10206719636917114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,1,4,power_law_1.01,0.14513280391693115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,1,4,power_law_1.2,0.06173440217971802
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,1,4,power_law_1.2,0.13463040590286254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,1,4,power_law_1.01,5.164569473266601
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,1,4,power_law_1.01,0.11543680429458618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,1,4,power_law_1.2,0.1004480004310608
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,1,4,power_law_1.2,0.09408000111579895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,1,4,power_law_1.01,8.192332458496093
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,1,4,power_law_1.01,0.13100160360336305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,1,4,power_law_1.2,0.12665599584579468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,1,4,power_law_1.2,0.12008320093154908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,1,4,power_law_1.01,0.16274559497833252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,1,4,power_law_1.2,0.13854080438613892
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,1,4,power_law_1.2,0.15366400480270387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,1,4,power_law_1.01,15.59851531982422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,1,4,power_law_1.01,0.19857280254364013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,1,4,power_law_1.2,0.18645119667053223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,1,4,power_law_1.2,0.19545600414276124
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,1,4,power_law_1.01,0.24977920055389405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,1,4,power_law_1.2,0.19381760358810424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,1,4,power_law_1.2,0.2407167911529541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,1,4,power_law_1.01,0.2694272041320801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,1,4,power_law_1.2,0.2212735891342163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,1,4,power_law_1.2,0.2501503944396973
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,1,4,power_law_1.01,0.2710720062255859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,1,4,power_law_1.2,0.23049600124359132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,1,4,power_law_1.2,0.26897919178009033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,1,4,power_law_1.2,0.24543359279632568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,1,4,power_law_1.01,0.2845952033996582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,1,4,power_law_1.2,0.27491838932037355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,1,4,power_law_1.2,0.27983999252319336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,1,4,power_law_1.01,0.3005759954452515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,1,4,power_law_1.2,0.2870016098022461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,1,4,power_law_1.2,0.31137919425964355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,1,4,power_law_1.01,0.3116352081298828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,1,4,power_law_1.2,0.29662721157073973
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,2,2,power_law_1.01,0.030643200874328612
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,1,4,power_law_1.2,0.34783999919891356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,1,4,power_law_1.01,0.29852800369262694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,1,4,power_law_1.2,0.3039999961853027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,2,2,power_law_1.01,0.05606399774551392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,1,4,power_law_1.2,0.30012800693511965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,1,4,power_law_1.01,0.3153088092803955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,1,4,power_law_1.2,0.31588480472564695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,2,2,power_law_1.01,0.06321280002593994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,1,4,power_law_1.2,0.3290047883987427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,1,4,power_law_1.2,0.3305984020233154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,1,4,power_law_1.01,0.32924160957336424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,2,2,power_law_1.01,0.08963840007781983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,1,4,power_law_1.2,0.39495038986206055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,1,4,power_law_1.2,0.34106879234313964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,2,2,power_law_1.01,0.14800000190734863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,1,4,power_law_1.01,0.3456255912780762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,1,4,power_law_1.2,0.36113920211791994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,2,2,power_law_1.01,0.13714560270309448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,1,4,power_law_1.2,0.36647040843963624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,1,4,power_law_1.01,0.34603519439697267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,1,4,power_law_1.2,0.41788158416748045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,2,2,power_law_1.01,0.18999040126800537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,1,4,power_law_1.2,0.4045504093170166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,1,4,power_law_1.01,0.3738879919052124
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,1,4,power_law_1.2,0.5976960182189941
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,2,2,power_law_1.01,0.1998080015182495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,1,4,power_law_1.2,0.44245119094848634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,1,4,power_law_1.01,0.40296320915222167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,2,2,power_law_1.01,0.19100799560546874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,1,4,power_law_1.2,0.6998784065246582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,1,4,power_law_1.2,0.5026624202728271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,1,4,power_law_1.01,0.46419200897216795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,2,2,power_law_1.01,0.20105600357055664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,1,4,power_law_1.2,0.933356761932373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,1,4,power_law_1.2,0.531334400177002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,1,4,power_law_1.01,0.5006207942962646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,2,2,power_law_1.01,0.21312639713287354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,1,4,power_law_1.2,1.288268756866455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,1,4,power_law_1.2,0.6392511844635009
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,1,4,power_law_1.01,0.6030720233917236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,2,2,power_law_1.01,0.23383040428161622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,1,4,power_law_1.2,1.777644729614258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,1,4,power_law_1.2,0.7379712104797364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,1,4,power_law_1.01,0.7208320140838623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,2,2,power_law_1.01,0.2559295892715454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,1,4,power_law_1.2,1.012377643585205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,1,4,power_law_1.01,0.897766399383545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,1,4,power_law_1.2,2.189798355102539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,2,2,power_law_1.01,0.2862080097198486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,1,4,power_law_1.2,1.2853952407836915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,1,4,power_law_1.01,1.0970368385314941
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,1,4,power_law_1.2,3.1910655975341795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,2,2,power_law_1.01,0.26679039001464844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,1,4,power_law_1.2,1.6640575408935547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,1,4,power_law_1.01,1.464857578277588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,1,4,power_law_1.2,4.495033645629883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,2,2,power_law_1.01,0.26924800872802734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,1,4,power_law_1.2,2.109721565246582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,1,4,power_law_1.01,1.89105281829834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,2,2,power_law_1.01,0.30426878929138185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,1,4,power_law_1.2,5.776396942138672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,2,2,power_law_1.01,0.2966975927352905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,1,4,power_law_1.2,2.358777618408203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,1,4,power_law_1.01,2.2717695236206055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,1,4,power_law_1.2,8.59533462524414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,2,2,power_law_1.01,0.33208959102630614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,1,4,power_law_1.2,3.847443389892578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,1,4,power_law_1.01,3.2668926239013674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,2,2,power_law_1.01,0.4732351779937744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,1,4,power_law_1.2,18.214585876464845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,2,2,power_law_1.01,0.5510399818420411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,1,4,power_law_1.2,7.758918762207031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,1,4,power_law_1.01,7.176723480224609
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,2,2,power_law_1.01,0.7253312110900879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,2,2,power_law_1.01,0.9092543601989747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,2,2,power_law_1.01,1.2456640243530273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,2,2,power_law_1.01,1.6293184280395507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,2,2,power_law_1.01,2.294707107543945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,2,2,power_law_1.01,3.0512447357177734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,2,2,power_law_1.2,0.032864001393318173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,2,2,power_law_1.2,0.056620800495147706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,2,2,power_law_1.01,3.6639999389648437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,2,2,power_law_1.2,0.05621119737625122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,2,2,power_law_1.2,0.08983680009841918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,2,2,power_law_1.01,5.9915519714355465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,2,2,power_law_1.2,0.11461119651794434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,2,2,power_law_1.2,0.08775039911270141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,2,2,power_law_1.2,0.131167995929718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,2,2,power_law_1.2,0.1023360013961792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,2,2,power_law_1.01,11.693561553955078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,2,2,power_law_1.2,0.13141119480133057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,2,2,power_law_1.2,0.13157119750976562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,2,2,power_law_1.2,0.1739967942237854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,2,2,power_law_1.2,0.18542079925537108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,2,2,power_law_1.2,0.19563519954681396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,2,2,power_law_1.2,0.21374080181121827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,2,2,power_law_1.2,0.197708797454834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,2,2,power_law_1.2,0.2902656078338623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,2,2,power_law_1.2,0.20284159183502198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,4,1,power_law_1.01,0.022457599639892578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,2,2,power_law_1.2,0.3067199945449829
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,2,2,power_law_1.2,0.2171839952468872
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,4,1,power_law_1.01,0.025523200631141663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,2,2,power_law_1.2,0.32228479385375974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,2,2,power_law_1.2,0.2450176000595093
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,4,1,power_law_1.01,0.035571199655532834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,2,2,power_law_1.2,0.3263808012008667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,2,2,power_law_1.2,0.2558720111846924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,4,1,power_law_1.01,0.05379840135574341
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,2,2,power_law_1.2,0.348089599609375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,2,2,power_law_1.2,0.29009280204772947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,4,1,power_law_1.01,0.10335999727249146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,2,2,power_law_1.2,0.3509567975997925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,2,2,power_law_1.2,0.26591360569000244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,4,1,power_law_1.01,0.12752000093460084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,2,2,power_law_1.2,0.35790719985961916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,4,1,power_law_1.01,0.1674623966217041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,2,2,power_law_1.2,0.2857919931411743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,2,2,power_law_1.2,0.38045439720153806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,4,1,power_law_1.01,0.18712960481643676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,2,2,power_law_1.2,0.3173248052597046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,2,2,power_law_1.2,0.4036096096038818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,4,1,power_law_1.01,0.19485440254211425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,2,2,power_law_1.2,0.3080960035324097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,2,2,power_law_1.2,0.410752010345459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,4,1,power_law_1.01,0.19489920139312744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,2,2,power_law_1.2,0.3506495952606201
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,2,2,power_law_1.2,0.4543744087219238
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,4,1,power_law_1.01,0.21415040493011475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,2,2,power_law_1.2,0.5034751892089844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,2,2,power_law_1.2,0.4994239807128906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,4,1,power_law_1.01,0.21658880710601808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,2,2,power_law_1.2,0.5714816093444824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,2,2,power_law_1.2,0.5342400074005127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,4,1,power_law_1.01,0.23053441047668458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,2,2,power_law_1.2,0.7797696113586425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,2,2,power_law_1.2,0.6283775806427002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,4,1,power_law_1.01,0.2510143995285034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,2,2,power_law_1.2,0.9476991653442383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,2,2,power_law_1.2,0.6462080001831054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,4,1,power_law_1.01,0.23585920333862304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,2,2,power_law_1.2,1.3439807891845703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,2,2,power_law_1.2,0.7728256225585938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,4,1,power_law_1.01,0.2477504014968872
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,2,2,power_law_1.2,0.8981696128845215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,2,2,power_law_1.2,1.6063232421875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,4,1,power_law_1.01,0.2721152067184448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,2,2,power_law_1.2,1.1126015663146973
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,2,2,power_law_1.2,2.2909631729125977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,4,1,power_law_1.01,0.2868671894073486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,2,2,power_law_1.2,1.3837568283081054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,2,2,power_law_1.2,3.3028865814208985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,4,1,power_law_1.01,0.31472001075744627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,2,2,power_law_1.2,1.936307144165039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,4,1,power_law_1.01,0.4078976154327393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,2,2,power_law_1.2,3.9379711151123047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,4,1,power_law_1.01,0.4805823802947998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,2,2,power_law_1.2,2.5046207427978517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,2,2,power_law_1.2,6.135916900634766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,4,1,power_law_1.01,0.6223167896270752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,2,2,power_law_1.2,2.8902656555175783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,4,1,power_law_1.01,0.7687424182891845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,2,2,power_law_1.2,12.070169830322266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,2,2,power_law_1.2,4.766233444213867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,4,1,power_law_1.01,1.0532095909118653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,4,1,power_law_1.01,1.338700771331787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,2,2,power_law_1.2,8.905241394042969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,4,1,power_law_1.01,1.8956991195678712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,4,1,power_law_1.01,2.4685888290405273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,4,1,power_law_1.2,0.023846399784088135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,4,1,power_law_1.01,3.030348777770996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,4,1,power_law_1.2,0.0271232008934021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,4,1,power_law_1.01,4.719532775878906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,4,1,power_law_1.2,0.034297600388526917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,4,1,power_law_1.2,0.05455999970436096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,4,1,power_law_1.01,9.285964965820312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,4,1,power_law_1.2,0.09676160216331482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,4,1,power_law_1.2,0.1192896008491516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,4,1,power_law_1.2,0.16516480445861817
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,4,1,power_law_1.2,0.187283194065094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,4,1,power_law_1.2,0.19833600521087646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,4,1,power_law_1.01,0.09413759708404541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,4,1,power_law_1.2,0.19630080461502075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,4,1,power_law_1.01,0.11072640419006348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,4,1,power_law_1.2,0.21001598834991456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,4,1,power_law_1.01,0.12074879407882691
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,4,1,power_law_1.2,0.2181567907333374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,4,1,power_law_1.01,0.18178559541702272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,4,1,power_law_1.2,0.22741119861602782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,4,1,power_law_1.01,0.24281599521636962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,4,1,power_law_1.2,0.259769606590271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,4,1,power_law_1.2,0.24483199119567872
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,4,1,power_law_1.01,0.2923583984375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,4,1,power_law_1.2,0.26119680404663087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,4,1,power_law_1.01,0.39560320377349856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,4,1,power_law_1.2,0.09435520172119141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,4,1,power_law_1.2,0.288044810295105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,4,1,power_law_1.2,0.10848640203475952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,4,1,power_law_1.01,0.4152703762054443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,4,1,power_law_1.2,0.29028480052947997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,4,1,power_law_1.2,0.1232192039489746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,4,1,power_law_1.01,0.42690558433532716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,4,1,power_law_1.2,0.31935360431671145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,4,1,power_law_1.2,0.16663680076599122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,4,1,power_law_1.01,0.44332160949707033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,4,1,power_law_1.2,0.4371391773223877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,4,1,power_law_1.2,0.21620481014251708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,4,1,power_law_1.01,0.45929598808288574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,4,1,power_law_1.2,0.4940864086151123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,4,1,power_law_1.2,0.2694528102874756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,4,1,power_law_1.01,0.4834559917449951
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,4,1,power_law_1.2,0.6470655918121337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,4,1,power_law_1.2,0.38331520557403564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,4,1,power_law_1.01,0.5055808067321778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,4,1,power_law_1.2,0.40830721855163576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,4,1,power_law_1.2,0.7805888175964355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,4,1,power_law_1.01,0.5027135848999024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,4,1,power_law_1.2,0.43062400817871094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,4,1,power_law_1.2,1.070803165435791
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,4,1,power_law_1.01,0.5088575839996338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,4,1,power_law_1.2,0.44250240325927737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,4,1,power_law_1.01,0.5244224071502686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,4,1,power_law_1.2,1.3463744163513183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,4,1,power_law_1.2,0.4601151943206787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,4,1,power_law_1.01,0.5788991928100586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,4,1,power_law_1.2,1.9198720932006836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,4,1,power_law_1.2,0.4830463886260986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,4,1,power_law_1.01,0.6597760200500489
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,4,1,power_law_1.2,2.5062143325805666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,4,1,power_law_1.2,0.4932864189147949
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,4,1,power_law_1.01,0.7085311889648438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,4,1,power_law_1.2,3.056108856201172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,4,1,power_law_1.2,0.4936960220336914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,4,1,power_law_1.01,0.8162688255310059
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,4,1,power_law_1.2,4.759219360351563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,4,1,power_law_1.2,0.536294412612915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,4,1,power_law_1.01,0.8924480438232422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,4,1,power_law_1.2,0.5576064109802246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,4,1,power_law_1.01,1.0855744361877442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,4,1,power_law_1.2,9.299021148681641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,4,1,power_law_1.2,0.5907648086547852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,4,1,power_law_1.01,1.2608768463134765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,4,1,power_law_1.2,0.6585599899291992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,4,1,power_law_1.01,1.6121088027954102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,4,1,power_law_1.2,0.73023362159729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,4,1,power_law_1.01,1.9535039901733398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,4,1,power_law_1.2,0.8392000198364258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,4,1,power_law_1.01,2.667251205444336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,4,1,power_law_1.2,0.9125247955322265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,1,4,power_law_1.01,0.02794879972934723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,4,1,power_law_1.01,3.3918079376220702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,4,1,power_law_1.2,1.0863871574401855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,1,4,power_law_1.01,0.028352001309394838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,1,4,power_law_1.01,0.034918400645256045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,4,1,power_law_1.2,1.2637568473815919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,4,1,power_law_1.01,4.121728134155274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,1,4,power_law_1.01,0.046367999911308286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,4,1,power_law_1.2,1.632588768005371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,4,1,power_law_1.01,6.310022354125977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,1,4,power_law_1.01,0.05498239994049072
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,4,1,power_law_1.2,1.9764543533325196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,1,4,power_law_1.01,0.07136639952659607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,4,1,power_law_1.2,2.6955072402954103
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,1,4,power_law_1.01,0.07873280048370361
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,4,1,power_law_1.01,12.378240203857422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,1,4,power_law_1.01,0.07093759775161743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,4,1,power_law_1.2,3.4114879608154296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,1,4,power_law_1.01,0.07525759935379028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,4,1,power_law_1.2,4.1532737731933596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,1,4,power_law_1.01,0.08117759823799134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,1,4,power_law_1.01,0.09265919923782348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,4,1,power_law_1.2,6.412422180175781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,1,4,power_law_1.01,0.0803712010383606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,1,4,power_law_1.2,0.027577599883079527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,1,4,power_law_1.01,0.08447359800338745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,4,1,power_law_1.2,12.643456268310548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,1,4,power_law_1.2,0.024915200471878052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,1,4,power_law_1.01,0.09594240188598632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,1,4,power_law_1.2,0.03351680040359497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,1,4,power_law_1.01,0.08775039911270141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,1,4,power_law_1.01,0.09143679738044738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,1,4,power_law_1.2,0.04314880073070526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,1,4,power_law_1.01,0.10474239587783814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,1,4,power_law_1.2,0.051532799005508424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,1,4,power_law_1.2,0.06995199918746949
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,1,4,power_law_1.01,0.13768960237503053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,1,4,power_law_1.01,0.05666559934616089
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,1,4,power_law_1.2,0.07850239872932434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,1,4,power_law_1.01,0.16842880249023437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,1,4,power_law_1.01,0.227622389793396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,1,4,power_law_1.01,0.05237119793891907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,1,4,power_law_1.2,0.0732479989528656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,1,4,power_law_1.01,0.05727999806404114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,1,4,power_law_1.01,0.27718400955200195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,1,4,power_law_1.2,0.07939839959144593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,1,4,power_law_1.01,0.06874880194664001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,1,4,power_law_1.01,0.38283519744873046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,1,4,power_law_1.2,0.08144000172615051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,1,4,power_law_1.01,0.07611520290374756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,1,4,power_law_1.01,0.49611520767211914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,1,4,power_law_1.2,0.09249920248985291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,1,4,power_law_1.01,0.09967359900474548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,1,4,power_law_1.2,0.08164479732513427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,1,4,power_law_1.01,0.6646527767181396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,1,4,power_law_1.01,0.10090240240097045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,1,4,power_law_1.2,0.08962560296058655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,1,4,power_law_1.01,0.9735103607177734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,1,4,power_law_1.01,0.1051967978477478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,1,4,power_law_1.2,0.10007679462432861
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,1,4,power_law_1.01,1.3144831657409668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,1,4,power_law_1.01,0.1076416015625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,1,4,power_law_1.2,0.08881919980049133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,1,4,power_law_1.01,1.9055488586425782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,1,4,power_law_1.01,0.10928000211715698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,1,4,power_law_1.2,0.09415040016174317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,1,4,power_law_1.01,2.510323143005371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,1,4,power_law_1.01,0.11010559797286987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,1,4,power_law_1.2,0.11031039953231811
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,1,4,power_law_1.01,0.11175680160522461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,1,4,power_law_1.01,3.724160003662109
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,1,4,power_law_1.2,0.14449280500411987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,1,4,power_law_1.01,0.11359360218048095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,1,4,power_law_1.2,0.1729920029640198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,1,4,power_law_1.01,7.636870574951172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,1,4,power_law_1.01,0.11872639656066894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,1,4,power_law_1.2,0.23256959915161132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,1,4,power_law_1.01,0.12978559732437134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,1,4,power_law_1.2,0.29689600467681887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,1,4,power_law_1.01,0.13468799591064454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,1,4,power_law_1.2,0.40705280303955077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,1,4,power_law_1.01,0.14573440551757813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,1,4,power_law_1.2,0.5162240028381347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,1,4,power_law_1.01,0.15926400423049927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,1,4,power_law_1.2,0.8084735870361328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,2,2,power_law_1.01,0.08834559917449951
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,1,4,power_law_1.2,0.05805439949035644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,1,4,power_law_1.01,0.16745599508285522
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,1,4,power_law_1.2,0.9895168304443359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,1,4,power_law_1.2,0.04799999892711639
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,2,2,power_law_1.01,0.11928319931030273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,1,4,power_law_1.01,0.20186240673065187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,1,4,power_law_1.2,1.4908479690551757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,1,4,power_law_1.2,0.05702400207519531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,1,4,power_law_1.01,0.23134078979492187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,2,2,power_law_1.01,0.10616960525512695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,1,4,power_law_1.2,2.0894975662231445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,1,4,power_law_1.2,0.06890239715576171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,1,4,power_law_1.01,0.29280641078948977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,2,2,power_law_1.01,0.13565440177917482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,1,4,power_law_1.2,0.07423359751701356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,1,4,power_law_1.01,0.3399104118347168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,1,4,power_law_1.2,2.4104127883911133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,2,2,power_law_1.01,0.1889024019241333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,1,4,power_law_1.2,0.10104320049285889
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,1,4,power_law_1.01,0.48264322280883787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,2,2,power_law_1.01,0.23765120506286622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,1,4,power_law_1.2,4.205708694458008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,1,4,power_law_1.2,0.1027008056640625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,1,4,power_law_1.01,0.591590404510498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,2,2,power_law_1.01,0.2974463939666748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,1,4,power_law_1.2,0.10698239803314209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,1,4,power_law_1.2,8.245574188232421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,1,4,power_law_1.01,0.7769343852996826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,2,2,power_law_1.01,0.3179136037826538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,1,4,power_law_1.2,0.10884480476379395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,1,4,power_law_1.01,1.0476799964904786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,1,4,power_law_1.2,0.11210240125656128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,2,2,power_law_1.01,0.3205888032913208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,1,4,power_law_1.01,1.203123188018799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,1,4,power_law_1.2,0.10720000267028809
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,2,2,power_law_1.01,0.33861119747161866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,1,4,power_law_1.2,0.11191040277481079
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,1,4,power_law_1.01,1.9694784164428711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,2,2,power_law_1.01,0.3539776086807251
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,2,2,power_law_1.01,0.022252799570560457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,1,4,power_law_1.2,0.11519360542297363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,2,2,power_law_1.01,0.35110399723052976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,2,2,power_law_1.01,0.024915200471878052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,1,4,power_law_1.01,3.567340850830078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,1,4,power_law_1.2,0.12686079740524292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,2,2,power_law_1.01,0.03922559916973114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,2,2,power_law_1.01,0.36175999641418455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,1,4,power_law_1.2,0.1295040011405945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,2,2,power_law_1.01,0.05440000295639038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,1,4,power_law_1.2,0.13649280071258546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,2,2,power_law_1.01,0.3578687906265259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,2,2,power_law_1.01,0.06566399931907654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,1,4,power_law_1.2,0.14833920001983641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,2,2,power_law_1.01,0.3806015968322754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,2,2,power_law_1.01,0.09127680063247681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,1,4,power_law_1.2,0.17130240201950073
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,2,2,power_law_1.2,0.0226623997092247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,2,2,power_law_1.01,0.3838720083236694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,2,2,power_law_1.01,0.07200639843940734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,1,4,power_law_1.2,0.17827199697494506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,2,2,power_law_1.2,0.025740799307823182
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,2,2,power_law_1.01,0.41541762351989747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,2,2,power_law_1.01,0.07856000065803528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,1,4,power_law_1.2,0.22659199237823485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,2,2,power_law_1.2,0.03617919981479645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,2,2,power_law_1.01,0.47316479682922363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,2,2,power_law_1.01,0.08552320003509521
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,1,4,power_law_1.2,0.24217600822448732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,2,2,power_law_1.2,0.050297600030899045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,2,2,power_law_1.01,0.5124927997589112
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,2,2,power_law_1.01,0.09188479781150818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,1,4,power_law_1.2,0.30709118843078614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,2,2,power_law_1.2,0.05749760270118713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,2,2,power_law_1.01,0.6001471996307373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,2,2,power_law_1.01,0.08554239869117737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,1,4,power_law_1.2,0.3838720083236694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,2,2,power_law_1.2,0.09168000221252441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,2,2,power_law_1.01,0.08963840007781983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,2,2,power_law_1.2,0.07508479952812194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,1,4,power_law_1.2,0.49159040451049807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,2,2,power_law_1.01,0.6284095764160156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,2,2,power_law_1.01,0.09701120257377624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,2,2,power_law_1.2,0.0804095983505249
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,1,4,power_law_1.2,0.6486847877502442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,2,2,power_law_1.01,0.7432896137237549
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,2,2,power_law_1.01,0.09105920195579528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,2,2,power_law_1.2,0.08264960050582885
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,1,4,power_law_1.2,0.8895423889160157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,2,2,power_law_1.01,0.8817407608032226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,2,2,power_law_1.01,0.10232959985733033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,2,2,power_law_1.2,0.09312639832496643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,1,4,power_law_1.2,1.2493568420410157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,2,2,power_law_1.01,1.099443244934082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,2,2,power_law_1.01,0.10622080564498901
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,2,2,power_law_1.2,0.08492799997329711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,1,4,power_law_1.2,1.5297344207763672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,2,2,power_law_1.01,1.3398591995239257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,2,2,power_law_1.01,0.10497920513153076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,2,2,power_law_1.2,0.09292160272598267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,1,4,power_law_1.2,2.858284759521484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,2,2,power_law_1.01,0.12342400550842285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,2,2,power_law_1.2,0.09701120257377624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,2,2,power_law_1.01,1.8643775939941407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,2,2,power_law_1.01,0.14758399724960328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,2,2,power_law_1.2,0.09208959937095643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,2,2,power_law_1.01,2.337459182739258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,1,4,power_law_1.2,5.408844757080078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,2,2,power_law_1.2,0.10581120252609252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,2,2,power_law_1.01,0.18711040019989014
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,2,2,power_law_1.01,2.9258495330810548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,2,2,power_law_1.2,0.11052160263061524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,2,2,power_law_1.01,0.23381121158599855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,2,2,power_law_1.2,0.10539519786834717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,2,2,power_law_1.01,0.3112191915512085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,2,2,power_law_1.01,4.178400039672852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,2,2,power_law_1.2,0.13265279531478882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,2,2,power_law_1.01,0.3988800048828125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,2,2,power_law_1.2,0.1465664029121399
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,2,2,power_law_1.01,0.5731584072113037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,2,2,power_law_1.01,8.443545532226562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,2,2,power_law_1.2,0.1887488007545471
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,2,2,power_law_1.01,0.052934402227401735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,2,2,power_law_1.01,0.774457597732544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,2,2,power_law_1.2,0.24281599521636962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,2,2,power_law_1.01,0.05456640124320984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,2,2,power_law_1.01,1.0867903709411622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,2,2,power_law_1.2,0.3214783906936646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,2,2,power_law_1.01,0.06440320014953613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,2,2,power_law_1.01,1.3481280326843261
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,2,2,power_law_1.01,0.08283519744873047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,2,2,power_law_1.2,0.41486082077026365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,2,2,power_law_1.01,1.8566207885742188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,2,2,power_law_1.01,0.09388800263404846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,2,2,power_law_1.2,0.5707136154174804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,2,2,power_law_1.01,0.12358399629592895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,2,2,power_law_1.2,0.05249919891357422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,2,2,power_law_1.2,0.772819185256958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,2,2,power_law_1.01,2.832512092590332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,2,2,power_law_1.01,0.1264448046684265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,2,2,power_law_1.2,0.05246719717979431
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,2,2,power_law_1.2,1.094591999053955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,2,2,power_law_1.01,0.1297279953956604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,2,2,power_law_1.01,5.567411041259765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,2,2,power_law_1.2,0.06231039762496948
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,2,2,power_law_1.2,1.4871871948242188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,2,2,power_law_1.01,0.1266495943069458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,2,2,power_law_1.2,0.07646080255508422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,2,2,power_law_1.2,1.8189760208129884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,2,2,power_law_1.01,0.13608319759368898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,2,2,power_law_1.2,0.08384640216827392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,2,2,power_law_1.01,0.1377087950706482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,2,2,power_law_1.2,2.957855987548828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,2,2,power_law_1.2,0.11886719465255738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,4,1,power_law_1.01,0.019193600118160247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,2,2,power_law_1.01,0.13934719562530518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,2,2,power_law_1.2,0.1250175952911377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,2,2,power_law_1.2,5.72081298828125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,2,2,power_law_1.01,0.14591360092163086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,4,1,power_law_1.01,0.021631999313831328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,2,2,power_law_1.2,0.13197439908981323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,2,2,power_law_1.01,0.1502079963684082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,4,1,power_law_1.01,0.024915200471878052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,2,2,power_law_1.2,0.12828799486160278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,2,2,power_law_1.01,0.16147199869155884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,4,1,power_law_1.01,0.03496319949626923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,2,2,power_law_1.2,0.13688960075378417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,2,2,power_law_1.01,0.16700799465179444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,4,1,power_law_1.01,0.049491199851036075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,2,2,power_law_1.2,0.13832319974899293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,4,1,power_law_1.2,0.01958400011062622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,2,2,power_law_1.01,0.17806719541549682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,4,1,power_law_1.01,0.06423680186271667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,2,2,power_law_1.2,0.1450816035270691
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,4,1,power_law_1.2,0.02102400064468384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,2,2,power_law_1.01,0.20774400234222412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,4,1,power_law_1.01,0.06975359916687011
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,2,2,power_law_1.2,0.14385279417037963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,4,1,power_law_1.2,0.0253248006105423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,2,2,power_law_1.01,0.21226239204406738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,4,1,power_law_1.01,0.07427840232849121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,2,2,power_law_1.2,0.1524608016014099
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,4,1,power_law_1.2,0.0341376006603241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,2,2,power_law_1.01,0.2566911935806274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,4,1,power_law_1.01,0.08001919984817504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,2,2,power_law_1.2,0.15961600542068483
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,4,1,power_law_1.2,0.04674560129642487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,2,2,power_law_1.01,0.28961279392242434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,4,1,power_law_1.01,0.0834879994392395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,2,2,power_law_1.2,0.1651520013809204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,4,1,power_law_1.2,0.06464639902114869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,2,2,power_law_1.01,0.37813758850097656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,4,1,power_law_1.01,0.09556480050086975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,2,2,power_law_1.2,0.17968000173568727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,4,1,power_law_1.2,0.07243520021438599
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,2,2,power_law_1.01,0.44736638069152834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,4,1,power_law_1.01,0.08839679956436157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,2,2,power_law_1.2,0.21305599212646484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,4,1,power_law_1.2,0.07652480006217957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,2,2,power_law_1.01,0.62673921585083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,4,1,power_law_1.01,0.09086080193519593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,2,2,power_law_1.2,0.21799039840698242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,4,1,power_law_1.2,0.08266879916191101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,4,1,power_law_1.01,0.10294400453567505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,2,2,power_law_1.2,0.26099839210510256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,4,1,power_law_1.2,0.08513280153274536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,4,1,power_law_1.01,0.10026880502700805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,2,2,power_law_1.2,0.31015040874481203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,4,1,power_law_1.2,0.09578880071640014
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,4,1,power_law_1.01,0.10560640096664428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,4,1,power_law_1.2,0.08943359851837158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,2,2,power_law_1.2,0.3691135883331299
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,4,1,power_law_1.01,0.11870720386505126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,4,1,power_law_1.2,0.09616000056266785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,2,2,power_law_1.2,0.44367361068725586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,4,1,power_law_1.01,0.1260800004005432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,4,1,power_law_1.2,0.10643199682235718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,2,2,power_law_1.2,0.647872018814087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,4,1,power_law_1.01,0.14410239458084106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,4,1,power_law_1.2,0.10354559421539307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,2,2,power_law_1.2,0.7936895847320556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,4,1,power_law_1.01,0.18016639947891236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,4,1,power_law_1.2,0.10909440517425537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,2,2,power_law_1.2,1.0879679679870606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,4,1,power_law_1.2,0.11912959814071655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,4,1,power_law_1.01,0.21414399147033691
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,2,2,power_law_1.2,1.5231743812561036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,4,1,power_law_1.2,0.1271232008934021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,4,1,power_law_1.01,0.28173439502716063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,2,2,power_law_1.2,1.9575616836547851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,4,1,power_law_1.2,0.14574719667434693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,4,1,power_law_1.01,0.355020809173584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,4,1,power_law_1.2,0.18097920417785646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,4,1,power_law_1.01,0.5042816162109375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,2,2,power_law_1.2,2.83941764831543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,4,1,power_law_1.2,0.21415679454803466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,4,1,power_law_1.01,0.6475135803222656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,2,2,power_law_1.2,5.782611083984375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,4,1,power_law_1.2,0.2915712118148804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,4,1,power_law_1.01,0.934233570098877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,4,1,power_law_1.2,0.3608000040054321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,4,1,power_law_1.01,1.225254440307617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,4,1,power_law_1.2,0.5055935859680176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,4,1,power_law_1.01,1.5162752151489258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,4,1,power_law_1.2,0.6507775783538818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,4,1,power_law_1.01,2.3833791732788088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,4,1,power_law_1.2,0.9411904335021972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,4,1,power_law_1.2,1.2338432312011718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,4,1,power_law_1.01,4.7301887512207035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,4,1,power_law_1.2,1.5276415824890137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,4,1,power_law_1.2,2.407142448425293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,4,1,power_law_1.01,0.057785600423812866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,4,1,power_law_1.01,0.06540160179138184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,4,1,power_law_1.2,4.7375743865966795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,4,1,power_law_1.01,0.07580800056457519
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,4,1,power_law_1.01,0.0942911982536316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,4,1,power_law_1.01,0.11313920021057129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,4,1,power_law_1.01,0.16024320125579833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,4,1,power_law_1.01,0.17272959947586058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,4,1,power_law_1.2,0.056857597827911374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,4,1,power_law_1.01,0.17703039646148683
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,4,1,power_law_1.2,0.0605567991733551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,4,1,power_law_1.01,0.18152960538864135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,4,1,power_law_1.2,0.07282559871673584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,4,1,power_law_1.01,0.18516479730606078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,4,1,power_law_1.2,0.08635519742965699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,4,1,power_law_1.01,0.18275840282440187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,4,1,power_law_1.2,0.10477440357208252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,1,4,power_law_1.01,0.05400959849357605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,4,1,power_law_1.01,0.19301120042800904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,4,1,power_law_1.2,0.1600767970085144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,1,4,power_law_1.01,0.05848960280418396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,4,1,power_law_1.01,0.19504640102386475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,4,1,power_law_1.2,0.17215360403060914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,1,4,power_law_1.01,0.06239359974861145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,4,1,power_law_1.01,0.21000320911407472
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,4,1,power_law_1.2,0.17605119943618774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,1,4,power_law_1.01,0.09147520065307617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,4,1,power_law_1.01,0.2190079927444458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,4,1,power_law_1.2,0.1801408052444458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,1,4,power_law_1.01,0.09844480156898498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,4,1,power_law_1.01,0.2263808012008667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,4,1,power_law_1.2,0.18629759550094604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,1,4,power_law_1.01,0.13714560270309448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,4,1,power_law_1.01,0.2460479974746704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,4,1,power_law_1.2,0.1875264048576355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,1,4,power_law_1.01,0.1557952046394348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,4,1,power_law_1.01,0.2986687898635864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,4,1,power_law_1.2,0.1918272018432617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,1,4,power_law_1.01,0.16663680076599122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,4,1,power_law_1.01,0.3119935989379883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,4,1,power_law_1.2,0.19857280254364013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,1,4,power_law_1.01,0.18097920417785646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,4,1,power_law_1.01,0.38202879428863523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,1,4,power_law_1.01,0.18936959505081177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,4,1,power_law_1.2,0.20943999290466309
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,1,4,power_law_1.01,0.21948800086975098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,4,1,power_law_1.01,0.43630080223083495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,4,1,power_law_1.2,0.22172799110412597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,1,4,power_law_1.01,0.2387392044067383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,4,1,power_law_1.2,0.22970879077911377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,4,1,power_law_1.01,0.5722879886627197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,1,4,power_law_1.01,0.20453119277954102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,4,1,power_law_1.2,0.25490560531616213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,4,1,power_law_1.01,0.7011263847351075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,1,4,power_law_1.01,0.23872001171112062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,4,1,power_law_1.2,0.2987328052520752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,4,1,power_law_1.01,0.9509759902954101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,1,4,power_law_1.01,0.25919361114501954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,4,1,power_law_1.2,0.3161344051361084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,4,1,power_law_1.01,1.201030445098877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,1,4,power_law_1.01,0.21578879356384278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,4,1,power_law_1.2,0.38536319732666013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,4,1,power_law_1.01,1.7038080215454101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,1,4,power_law_1.01,0.2469183921813965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,4,1,power_law_1.2,0.4498752117156982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,4,1,power_law_1.01,2.1996223449707033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,1,4,power_law_1.01,0.3419584035873413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,4,1,power_law_1.2,0.5838208198547363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,4,1,power_law_1.01,2.7032192230224608
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,1,4,power_law_1.01,0.40830721855163576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,4,1,power_law_1.2,0.6974400043487549
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,1,4,power_law_1.01,0.5338496208190918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,4,1,power_law_1.01,4.185984039306641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,4,1,power_law_1.2,0.9493760108947754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,1,4,power_law_1.01,0.6475008010864258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,4,1,power_law_1.2,1.1977791786193848
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,4,1,power_law_1.01,8.29345932006836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,1,4,power_law_1.01,0.9469183921813965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,4,1,power_law_1.2,1.6997631072998047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,1,4,power_law_1.01,1.221555233001709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,4,1,power_law_1.2,2.1964031219482423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,1,4,power_law_1.01,1.7411455154418944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,4,1,power_law_1.2,2.692198371887207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,1,4,power_law_1.01,2.3182655334472657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,4,1,power_law_1.2,4.204256057739258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,1,4,power_law_1.01,3.373798370361328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,1,4,power_law_1.01,4.462297439575195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,4,1,power_law_1.2,8.41228790283203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,1,4,power_law_1.2,0.04103679955005646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,1,4,power_law_1.2,0.033881598711013795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,1,4,power_law_1.01,5.6810752868652346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,1,4,power_law_1.2,0.04636160135269165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,1,4,power_law_1.01,8.648844909667968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,1,4,power_law_1.2,0.05660799741744995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,1,4,power_law_1.2,0.07176960110664368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,1,4,power_law_1.01,18.081919860839843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,1,4,power_law_1.2,0.0863103985786438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,1,4,power_law_1.2,0.10371199846267701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,1,4,power_law_1.2,0.1145792007446289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,1,4,power_law_1.01,0.10273280143737792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,1,4,power_law_1.2,0.12849279642105102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,1,4,power_law_1.01,0.13018239736557008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,1,4,power_law_1.2,0.1381183981895447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,1,4,power_law_1.01,0.08921599984169007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,1,4,power_law_1.2,0.16577279567718506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,1,4,power_law_1.01,0.11565439701080323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,1,4,power_law_1.2,0.1893183946609497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,1,4,power_law_1.01,0.15005439519882202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,1,4,power_law_1.2,0.1487552046775818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,1,4,power_law_1.2,0.1011199951171875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,1,4,power_law_1.01,0.20062079429626464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,1,4,power_law_1.2,0.18194559812545777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,1,4,power_law_1.2,0.0830847978591919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,1,4,power_law_1.01,0.2018496036529541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,1,4,power_law_1.2,0.0865664005279541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,1,4,power_law_1.2,0.20509440898895265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,1,4,power_law_1.01,0.21783039569854737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,1,4,power_law_1.2,0.12239999771118164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,1,4,power_law_1.2,0.15511679649353027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,1,4,power_law_1.01,0.21660161018371582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,1,4,power_law_1.2,0.1326464056968689
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,1,4,power_law_1.2,0.19136639833450317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,1,4,power_law_1.01,0.22069759368896485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,1,4,power_law_1.2,0.19591679573059081
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,1,4,power_law_1.2,0.24789121150970458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,1,4,power_law_1.01,0.22520959377288818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,1,4,power_law_1.2,0.2043328046798706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,1,4,power_law_1.2,0.30687360763549804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,1,4,power_law_1.01,0.2305216073989868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,1,4,power_law_1.2,0.21475839614868164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,1,4,power_law_1.2,0.4404032230377197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,1,4,power_law_1.01,0.23257598876953126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,1,4,power_law_1.2,0.2204927921295166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,1,4,power_law_1.01,0.24569599628448485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,1,4,power_law_1.2,0.5993343830108643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,1,4,power_law_1.2,0.21989760398864747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,1,4,power_law_1.01,0.26023039817810056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,1,4,power_law_1.2,0.7916287899017334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,1,4,power_law_1.2,0.22992639541625975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,1,4,power_law_1.01,0.26289279460906984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,1,4,power_law_1.2,1.1588479995727539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,1,4,power_law_1.2,0.23339519500732422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,1,4,power_law_1.01,0.28049919605255125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,1,4,power_law_1.2,1.6222784042358398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,1,4,power_law_1.2,0.24119040966033936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,1,4,power_law_1.01,0.3163455963134766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,1,4,power_law_1.2,1.9292863845825194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,1,4,power_law_1.2,0.25858559608459475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,1,4,power_law_1.01,0.3444096088409424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,1,4,power_law_1.2,3.265625762939453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,1,4,power_law_1.2,0.2590143918991089
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,1,4,power_law_1.01,0.4007296085357666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,1,4,power_law_1.2,0.2747711896896362
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,1,4,power_law_1.2,4.362924957275391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,1,4,power_law_1.01,0.43758721351623536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,1,4,power_law_1.2,0.30261759757995604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,1,4,power_law_1.01,0.5236095905303955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,1,4,power_law_1.2,5.229638290405274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,1,4,power_law_1.2,0.32434558868408203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,1,4,power_law_1.01,0.6358272075653076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,1,4,power_law_1.2,0.3534208059310913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,1,4,power_law_1.2,7.362016296386718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,1,4,power_law_1.01,0.8265088081359864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,1,4,power_law_1.2,0.433900785446167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,1,4,power_law_1.01,1.014515209197998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,1,4,power_law_1.2,0.45316481590270996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,1,4,power_law_1.2,15.396467590332032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,1,4,power_law_1.2,0.5686528205871582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,1,4,power_law_1.01,1.4049920082092284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,1,4,power_law_1.2,0.6458752155303955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,1,4,power_law_1.01,1.8152704238891602
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,1,4,power_law_1.2,0.9321855545043946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,1,4,power_law_1.01,2.2811904907226563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,1,4,power_law_1.2,1.1240703582763671
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,2,2,power_law_1.01,0.02465279996395111
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,1,4,power_law_1.01,3.871257781982422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,2,2,power_law_1.01,0.026495999097824095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,1,4,power_law_1.2,1.6117055892944336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,2,2,power_law_1.01,0.03304960131645203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,1,4,power_law_1.2,2.3061759948730467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,1,4,power_law_1.01,6.799692535400391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,2,2,power_law_1.01,0.05374079942703247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,1,4,power_law_1.2,2.570560073852539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,2,2,power_law_1.01,0.0676800012588501
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,2,2,power_law_1.01,0.09305599927902222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,1,4,power_law_1.2,4.086912155151367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,2,2,power_law_1.01,0.1024832010269165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,2,2,power_law_1.01,0.0967423975467682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,1,4,power_law_1.2,9.534815979003906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,2,2,power_law_1.2,0.034745600819587705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,2,2,power_law_1.01,0.11006720066070556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,2,2,power_law_1.2,0.03290880024433136
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,2,2,power_law_1.01,0.11967999935150146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,2,2,power_law_1.2,0.036595198512077334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,2,2,power_law_1.01,0.1352512001991272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,2,2,power_law_1.2,0.03986560106277466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,2,2,power_law_1.01,0.1565567970275879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,2,2,power_law_1.2,0.054816001653671266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,2,2,power_law_1.01,0.12336640357971192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,2,2,power_law_1.2,0.0732479989528656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,2,2,power_law_1.01,0.14098559617996215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,2,2,power_law_1.2,0.09045760035514831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,2,2,power_law_1.01,0.1692479968070984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,2,2,power_law_1.2,0.09168000221252441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,2,2,power_law_1.01,0.08635519742965699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,2,2,power_law_1.01,0.12951680421829223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,2,2,power_law_1.2,0.10458240509033204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,2,2,power_law_1.01,0.8116991996765137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,2,2,power_law_1.01,0.10007679462432861
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,2,2,power_law_1.01,0.15572479963302613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,2,2,power_law_1.2,0.11704959869384765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,2,2,power_law_1.01,1.0439488410949707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,2,2,power_law_1.01,0.10069760084152221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,2,2,power_law_1.01,0.2079616069793701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,2,2,power_law_1.2,0.14657280445098878
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,2,2,power_law_1.01,1.3599552154541015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,2,2,power_law_1.01,0.12402559518814087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,2,2,power_law_1.01,0.24277119636535643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,2,2,power_law_1.2,0.17339520454406737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,2,2,power_law_1.01,1.6780031204223633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,2,2,power_law_1.01,0.15598080158233643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,2,2,power_law_1.01,0.33902080059051515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,2,2,power_law_1.2,0.1254591941833496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,2,2,power_law_1.01,2.5717695236206053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,2,2,power_law_1.01,0.22931199073791503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,2,2,power_law_1.2,0.15640319585800172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,2,2,power_law_1.01,0.4092544078826904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,2,2,power_law_1.01,0.24058239459991454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,2,2,power_law_1.2,0.1838271975517273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,2,2,power_law_1.01,0.564908790588379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,2,2,power_law_1.01,4.904844665527344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,2,2,power_law_1.01,0.2456831932067871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,2,2,power_law_1.2,0.13139840364456176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,2,2,power_law_1.01,0.7297664165496827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,2,2,power_law_1.01,0.25428481101989747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,2,2,power_law_1.2,0.16378240585327147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,2,2,power_law_1.01,1.1383551597595214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,2,2,power_law_1.01,0.2567487955093384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,2,2,power_law_1.2,0.22274560928344728
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,2,2,power_law_1.01,1.401318359375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,2,2,power_law_1.01,0.2561280012130737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,2,2,power_law_1.2,0.27596800327301024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,2,2,power_law_1.01,2.1754432678222657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,2,2,power_law_1.01,0.2702784061431885
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,2,2,power_law_1.2,0.39150080680847166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,2,2,power_law_1.01,2.7960063934326174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,2,2,power_law_1.01,0.27681920528411863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,2,2,power_law_1.2,0.5076223850250244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,2,2,power_law_1.01,0.2839871883392334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,2,2,power_law_1.01,3.450342559814453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,2,2,power_law_1.2,0.7732480049133301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,2,2,power_law_1.2,0.0893887996673584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,2,2,power_law_1.01,0.2995584011077881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,2,2,power_law_1.2,0.9923839569091797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,2,2,power_law_1.01,5.518201446533203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,2,2,power_law_1.2,0.08406400084495544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,2,2,power_law_1.01,0.306931209564209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,2,2,power_law_1.2,1.4697664260864258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,2,2,power_law_1.2,0.09553279876708984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,2,2,power_law_1.01,0.3177792072296143
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,2,2,power_law_1.01,11.06398696899414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,2,2,power_law_1.2,1.9862848281860352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,2,2,power_law_1.2,0.11847039461135864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,2,2,power_law_1.01,0.362828803062439
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,2,2,power_law_1.2,2.92425594329834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,2,2,power_law_1.2,0.1479423999786377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,2,2,power_law_1.01,0.3994879961013794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,2,2,power_law_1.2,0.22291839122772217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,2,2,power_law_1.01,0.4736320018768311
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,2,2,power_law_1.2,3.9302337646484373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,2,2,power_law_1.2,0.2405247926712036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,2,2,power_law_1.01,0.5076352119445801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,2,2,power_law_1.2,4.995404815673828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,2,2,power_law_1.2,0.24708480834960939
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,2,2,power_law_1.01,0.6409535884857178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,4,1,power_law_1.01,0.02588160037994385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,2,2,power_law_1.2,7.924262237548828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,2,2,power_law_1.2,0.2581439971923828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,2,2,power_law_1.01,0.7646527767181397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,4,1,power_law_1.01,0.030195200443267824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,2,2,power_law_1.2,0.25936639308929443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,4,1,power_law_1.01,0.039001598954200745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,2,2,power_law_1.01,0.9457088470458984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,2,2,power_law_1.2,15.63702392578125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,2,2,power_law_1.2,0.276147198677063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,4,1,power_law_1.01,0.06213759779930115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,2,2,power_law_1.01,1.2195008277893067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,2,2,power_law_1.2,0.27658240795135497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,4,1,power_law_1.01,0.09696000218391418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,2,2,power_law_1.01,1.671072006225586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,2,2,power_law_1.2,0.29049599170684814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,4,1,power_law_1.01,0.0840448021888733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,2,2,power_law_1.01,2.147238349914551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,2,2,power_law_1.2,0.28743040561676025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,4,1,power_law_1.01,0.09428480267524719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,2,2,power_law_1.01,2.497260856628418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,2,2,power_law_1.2,0.30217599868774414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,4,1,power_law_1.01,0.10822399854660034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,4,1,power_law_1.2,0.025702399015426636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,2,2,power_law_1.01,3.8798591613769533
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,2,2,power_law_1.2,0.31629440784454343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,4,1,power_law_1.01,0.1229632019996643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,4,1,power_law_1.2,0.027577599883079527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,2,2,power_law_1.2,0.33369600772857666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,4,1,power_law_1.01,0.13319040536880494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,4,1,power_law_1.2,0.035155200958251955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,2,2,power_law_1.01,7.568096160888672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,2,2,power_law_1.2,0.37015039920806886
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,4,1,power_law_1.2,0.04170880019664765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,2,2,power_law_1.2,0.4053952217102051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,4,1,power_law_1.2,0.07980160117149353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,2,2,power_law_1.2,0.45516161918640136
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,4,1,power_law_1.2,0.06588159799575806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,2,2,power_law_1.2,0.5108479976654052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,4,1,power_law_1.2,0.07895039916038513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,2,2,power_law_1.2,0.6341504096984864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,4,1,power_law_1.2,0.08922240138053894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,4,1,power_law_1.2,0.10169600248336792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,2,2,power_law_1.2,0.7920512199401856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,4,1,power_law_1.2,0.11338239908218384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,2,2,power_law_1.2,1.0353471755981445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,4,1,power_law_1.2,0.11829119920730591
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,2,2,power_law_1.2,1.2062911987304688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,4,1,power_law_1.2,0.13856639862060546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,2,2,power_law_1.2,1.7083263397216797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,4,1,power_law_1.2,0.12097280025482178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,2,2,power_law_1.2,2.338707160949707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,4,1,power_law_1.2,0.12360960245132446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,4,1,power_law_1.01,0.08000640273094177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,2,2,power_law_1.2,2.741139221191406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,4,1,power_law_1.2,0.14491519927978516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,4,1,power_law_1.01,0.0969983994960785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,2,2,power_law_1.2,4.698598480224609
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,4,1,power_law_1.2,0.1404096007347107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,4,1,power_law_1.01,0.1164736032485962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,4,1,power_law_1.2,0.13755520582199096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,4,1,power_law_1.01,0.15639679431915282
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,2,2,power_law_1.2,9.031148529052734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,4,1,power_law_1.01,0.19491839408874512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,4,1,power_law_1.2,0.166975998878479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,4,1,power_law_1.01,0.2919487953186035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,4,1,power_law_1.2,0.20350079536437987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,4,1,power_law_1.01,0.314515209197998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,4,1,power_law_1.2,0.2747391939163208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,4,1,power_law_1.01,0.33495678901672366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,4,1,power_law_1.2,0.344812798500061
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,4,1,power_law_1.01,0.3347775936126709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,4,1,power_law_1.2,0.48874878883361816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,4,1,power_law_1.01,0.339084792137146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,4,1,power_law_1.2,0.6368512153625489
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,4,1,power_law_1.01,0.35117440223693847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,4,1,power_law_1.2,0.9297087669372559
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,4,1,power_law_1.01,0.35136640071868896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,4,1,power_law_1.2,1.2199295997619628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,4,1,power_law_1.01,0.3636543989181519
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,4,1,power_law_1.2,1.8111616134643556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,4,1,power_law_1.01,0.36796159744262696
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,4,1,power_law_1.2,2.3964864730834963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,4,1,power_law_1.01,0.40215678215026857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,4,1,power_law_1.2,0.08324480056762695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,4,1,power_law_1.01,0.39582080841064454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,4,1,power_law_1.2,2.9803775787353515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,4,1,power_law_1.2,0.09082239866256714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,4,1,power_law_1.01,0.445363187789917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,4,1,power_law_1.2,4.7518974304199215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,4,1,power_law_1.2,0.11928319931030273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,4,1,power_law_1.01,0.5178559780120849
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,4,1,power_law_1.2,0.14916479587554932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,4,1,power_law_1.01,0.5608767986297607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,4,1,power_law_1.2,9.473356628417969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,4,1,power_law_1.2,0.17909120321273803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,4,1,power_law_1.01,0.6753471851348877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,4,1,power_law_1.2,0.2886591911315918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,4,1,power_law_1.01,0.7097599983215332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,4,1,power_law_1.2,0.3083199977874756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,4,1,power_law_1.01,0.9100607872009278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,4,1,power_law_1.2,0.33740160465240476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,4,1,power_law_1.01,1.0765695571899414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,4,1,power_law_1.2,0.34885120391845703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,4,1,power_law_1.01,1.4206272125244142
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,4,1,power_law_1.2,0.3509183883666992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,4,1,power_law_1.01,1.759993553161621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,4,1,power_law_1.2,0.3691456079483032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,4,1,power_law_1.01,2.443596839904785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,4,1,power_law_1.2,0.36751360893249513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,4,1,power_law_1.01,3.1706432342529296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,1,4,power_law_1.01,0.10252799987792968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,4,1,power_law_1.2,0.3638144016265869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,4,1,power_law_1.01,3.8159553527832033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,4,1,power_law_1.2,0.3988415956497192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,1,4,power_law_1.01,0.1426751971244812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,4,1,power_law_1.2,0.41152639389038087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,1,4,power_law_1.01,0.2084223985671997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,4,1,power_law_1.01,5.894476699829101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,4,1,power_law_1.2,0.4287424087524414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,1,4,power_law_1.01,0.12260479927062988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,4,1,power_law_1.2,0.46579837799072266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,4,1,power_law_1.01,11.593241882324218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,1,4,power_law_1.01,0.16376960277557373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,4,1,power_law_1.2,0.5206783771514892
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,4,1,power_law_1.2,0.5735360145568847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,1,4,power_law_1.01,0.22826879024505614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,4,1,power_law_1.2,0.6949632167816162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,1,4,power_law_1.01,0.2628799915313721
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,4,1,power_law_1.2,0.7207808017730712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,1,4,power_law_1.01,0.3304703950881958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,4,1,power_law_1.2,0.9091903686523437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,1,4,power_law_1.01,0.32515199184417726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,4,1,power_law_1.2,1.0744768142700196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,1,4,power_law_1.01,0.3392767906188965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,4,1,power_law_1.2,1.423846435546875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,4,1,power_law_1.2,1.752569580078125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,1,4,power_law_1.01,0.37389440536499025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,1,4,power_law_1.2,0.10335359573364258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,4,1,power_law_1.2,2.4455999374389648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,1,4,power_law_1.2,0.1447424054145813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,1,4,power_law_1.01,0.382476806640625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,4,1,power_law_1.2,3.1636224746704102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,1,4,power_law_1.2,0.12524800300598143
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,1,4,power_law_1.01,0.37265279293060305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,1,4,power_law_1.2,0.12772480249404908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,4,1,power_law_1.2,3.8318592071533204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,1,4,power_law_1.01,0.40051841735839844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,1,4,power_law_1.2,0.1660223960876465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,1,4,power_law_1.01,0.4017471790313721
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,4,1,power_law_1.2,5.9312896728515625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,1,4,power_law_1.2,0.21723520755767822
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,1,4,power_law_1.01,0.4092991828918457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,4,1,power_law_1.2,11.776697540283203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,1,4,power_law_1.2,0.23749759197235107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,1,4,power_law_1.01,0.44693760871887206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,1,4,power_law_1.2,0.31122560501098634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,1,4,power_law_1.01,0.46790399551391604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,1,4,power_law_1.2,0.32698879241943357
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,1,4,power_law_1.01,0.5035264015197753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,1,4,power_law_1.2,0.34194560050964357
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,1,4,power_law_1.01,0.5666175842285156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,1,4,power_law_1.2,0.3496959924697876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,1,4,power_law_1.01,0.6429887771606445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,1,4,power_law_1.2,0.36446080207824705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,1,4,power_law_1.01,0.75763840675354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,1,4,power_law_1.2,0.3685760021209717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,1,4,power_law_1.01,0.8076607704162597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,1,4,power_law_1.2,0.38576641082763674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,1,4,power_law_1.01,1.0769856452941895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,2,2,power_law_1.01,0.09429759979248047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,1,4,power_law_1.2,0.4261184215545654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,1,4,power_law_1.01,1.3227392196655274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,2,2,power_law_1.01,0.12501120567321777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,1,4,power_law_1.2,0.41936001777648924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,2,2,power_law_1.01,0.17333760261535644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,1,4,power_law_1.01,1.6848064422607423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,1,4,power_law_1.2,0.4412799835205078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,2,2,power_law_1.01,0.13607679605484008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,1,4,power_law_1.01,2.0604095458984375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,1,4,power_law_1.2,0.47489280700683595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,2,2,power_law_1.01,0.20632319450378417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,1,4,power_law_1.01,2.4960256576538087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,1,4,power_law_1.2,0.5195199966430664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,2,2,power_law_1.01,0.27022080421447753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,1,4,power_law_1.2,0.5899712085723877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,1,4,power_law_1.01,3.605836868286133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,2,2,power_law_1.01,0.31303679943084717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,1,4,power_law_1.2,0.6622591972351074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,2,2,power_law_1.01,0.38757760524749757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,1,4,power_law_1.01,6.799289703369141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,1,4,power_law_1.2,0.8232255935668945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,2,2,power_law_1.01,0.3988415956497192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,1,4,power_law_1.2,0.8867199897766114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,2,2,power_law_1.01,0.42218241691589353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,1,4,power_law_1.2,1.1175359725952148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,2,2,power_law_1.01,0.43549442291259766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,1,4,power_law_1.2,1.320684814453125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,2,2,power_law_1.01,0.4567872047424316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,1,4,power_law_1.2,1.8742656707763672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,2,2,power_law_1.01,0.4633471965789795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,1,4,power_law_1.2,2.2742336273193358
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,2,2,power_law_1.01,0.48956799507141113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,1,4,power_law_1.2,2.6782976150512696
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,2,2,power_law_1.01,0.49202561378479004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,1,4,power_law_1.2,4.172518539428711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,2,2,power_law_1.2,0.09432960152626038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,2,2,power_law_1.01,0.5157760143280029
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,2,2,power_law_1.2,0.12588160037994384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,2,2,power_law_1.01,0.5288832187652588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,1,4,power_law_1.2,8.222649383544923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,2,2,power_law_1.2,0.13019520044326782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,2,2,power_law_1.01,0.5792704105377198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,2,2,power_law_1.2,0.13386240005493164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,2,2,power_law_1.01,0.6288256168365478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,2,2,power_law_1.2,0.19366400241851806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,2,2,power_law_1.01,0.7117568016052246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,2,2,power_law_1.2,0.24608640670776366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,2,2,power_law_1.01,0.803104019165039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,2,2,power_law_1.2,0.28419198989868166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,2,2,power_law_1.01,0.958739185333252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,2,2,power_law_1.2,0.3583103895187378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,2,2,power_law_1.01,1.0419008255004882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,2,2,power_law_1.2,0.3898688077926636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,2,2,power_law_1.01,1.2899264335632323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,2,2,power_law_1.2,0.39640960693359373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,2,2,power_law_1.01,1.592409610748291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,2,2,power_law_1.2,0.44332160949707033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,2,2,power_law_1.01,2.0468544006347655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,2,2,power_law_1.2,0.4498623847961426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,2,2,power_law_1.01,2.602873611450195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,4,1,power_law_1.01,0.1074560046195984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,2,2,power_law_1.2,0.44618239402771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,2,2,power_law_1.01,3.158297538757324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,4,1,power_law_1.01,0.11913599967956542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,2,2,power_law_1.2,0.4732223987579346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,4,1,power_law_1.01,0.15681920051574708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,2,2,power_law_1.2,0.48234238624572756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,2,2,power_law_1.01,4.632249450683593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,4,1,power_law_1.01,0.18629759550094604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,2,2,power_law_1.2,0.5080319881439209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,4,1,power_law_1.01,0.27026560306549074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,2,2,power_law_1.01,9.095852661132813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,2,2,power_law_1.2,0.5448319911956787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,4,1,power_law_1.01,0.3685823917388916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,2,2,power_law_1.2,0.5977407932281494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,4,1,power_law_1.01,0.41239042282104493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,2,2,power_law_1.2,0.6343488216400146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,4,1,power_law_1.01,0.5199039936065674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,2,2,power_law_1.2,0.7150527954101562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,4,1,power_law_1.01,0.5547391891479492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,2,2,power_law_1.2,0.8408255577087402
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,4,1,power_law_1.01,0.5744063854217529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,2,2,power_law_1.2,1.0251520156860352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,4,1,power_law_1.01,0.1297279953956604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,4,1,power_law_1.01,0.5891392230987549
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,2,2,power_law_1.2,1.0472576141357421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,4,1,power_law_1.01,0.14837759733200073
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,4,1,power_law_1.01,0.6173952102661133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,4,1,power_law_1.01,0.14343039989471434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,2,2,power_law_1.2,1.350175952911377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,4,1,power_law_1.01,0.1422144055366516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,4,1,power_law_1.01,0.6333824157714844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,2,2,power_law_1.2,1.6166208267211915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,4,1,power_law_1.01,0.16307200193405152
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,4,1,power_law_1.01,0.6499584197998047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,2,2,power_law_1.2,2.2000896453857424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,4,1,power_law_1.01,0.16186239719390869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,4,1,power_law_1.01,0.6729087829589844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,4,1,power_law_1.2,0.10945919752120972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,4,1,power_law_1.01,0.155731201171875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,2,2,power_law_1.2,2.670515251159668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,4,1,power_law_1.2,0.1205183982849121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,4,1,power_law_1.01,0.6901055812835694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,4,1,power_law_1.01,0.18766720294952394
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,2,2,power_law_1.2,3.1405311584472657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,4,1,power_law_1.2,0.14569599628448487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,4,1,power_law_1.01,0.21287040710449218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,4,1,power_law_1.01,0.7159232139587403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,4,1,power_law_1.01,0.29663360118865967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,2,2,power_law_1.2,4.843046569824219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,4,1,power_law_1.2,0.18032000064849854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,4,1,power_law_1.01,0.8137920379638672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,4,1,power_law_1.01,0.3695231914520264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,4,1,power_law_1.2,0.2536128044128418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,4,1,power_law_1.01,0.8584447860717773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,2,2,power_law_1.2,9.196678161621094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,4,1,power_law_1.01,0.5219136238098144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,4,1,power_law_1.2,0.32755839824676514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,4,1,power_law_1.01,1.0145024299621581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,4,1,power_law_1.01,0.6626239776611328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,4,1,power_law_1.2,0.3904128074645996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,4,1,power_law_1.01,1.1314432144165039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,4,1,power_law_1.01,0.9620160102844239
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,4,1,power_law_1.2,0.4997888088226318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,4,1,power_law_1.01,1.363276767730713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,4,1,power_law_1.01,1.2439680099487305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,4,1,power_law_1.2,0.5182208061218262
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,4,1,power_law_1.01,1.4685440063476562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,4,1,power_law_1.01,1.829075241088867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,4,1,power_law_1.2,0.5423935890197754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,4,1,power_law_1.01,1.8965120315551758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,4,1,power_law_1.01,2.4181312561035155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,4,1,power_law_1.2,0.5768127918243409
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,4,1,power_law_1.01,2.210745620727539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,4,1,power_law_1.01,3.012281608581543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,4,1,power_law_1.2,0.6025983810424804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,4,1,power_law_1.01,2.982841682434082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,4,1,power_law_1.01,4.76044807434082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,4,1,power_law_1.2,0.6259647846221924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,4,1,power_law_1.01,3.760268783569336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,4,1,power_law_1.2,0.644601583480835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,4,1,power_law_1.01,9.465459442138672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,4,1,power_law_1.01,4.531942367553711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,4,1,power_law_1.2,0.6802239894866944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,4,1,power_law_1.2,0.6646592140197753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,4,1,power_law_1.01,6.788992309570313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,4,1,power_law_1.2,0.7252927780151367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,4,1,power_law_1.2,0.8281023979187012
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,4,1,power_law_1.01,13.18140869140625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,4,1,power_law_1.2,0.8976575851440429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,4,1,power_law_1.2,1.0419072151184081
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,4,1,power_law_1.2,1.1453375816345215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,4,1,power_law_1.2,1.3881535530090332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,4,1,power_law_1.2,1.5260607719421386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,4,1,power_law_1.2,1.9391424179077148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,4,1,power_law_1.2,2.2520639419555666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,4,1,power_law_1.2,3.0109888076782227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,4,1,power_law_1.2,3.816339111328125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,4,1,power_law_1.2,4.568678283691407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,4,1,power_law_1.2,6.861100769042968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,4,1,power_law_1.2,13.372773742675781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,8,power_law_1.01,0.08410239815711976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,8,power_law_1.01,0.10184320211410522
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,8,power_law_1.01,0.08267520070075988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,8,power_law_1.01,0.0834879994392395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,8,power_law_1.01,0.08431360125541687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,8,power_law_1.01,0.08922880291938781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,8,power_law_1.01,0.09823359847068787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,8,power_law_1.01,0.11871999502182007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,8,power_law_1.01,0.13674880266189576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,8,power_law_1.01,0.1534208059310913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,8,power_law_1.01,0.138374400138855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,8,power_law_1.01,0.16907520294189454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,8,power_law_1.01,0.19100799560546874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,8,power_law_1.01,0.14143359661102295
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,8,power_law_1.2,0.08629760146141052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,8,power_law_1.01,0.18035839796066283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,8,power_law_1.2,0.10449919700622559
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,8,power_law_1.01,0.18609280586242677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,8,power_law_1.2,0.08691840171813965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,8,power_law_1.01,0.2515903949737549
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,8,power_law_1.2,0.08834559917449951
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,8,power_law_1.01,0.33702399730682375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,8,power_law_1.2,0.08793600201606751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,8,power_law_1.01,0.30711679458618163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,4,power_law_1.01,0.08472319841384887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,8,power_law_1.2,0.09511039853096008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,8,power_law_1.01,0.4392127990722656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,4,power_law_1.01,0.09167360067367554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,8,power_law_1.2,0.10085120201110839
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,8,power_law_1.01,0.5571775913238526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,4,power_law_1.01,0.07980800271034241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,8,power_law_1.2,0.10330239534378052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,8,power_law_1.01,0.8506624221801757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,4,power_law_1.01,0.08389120101928711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,8,power_law_1.2,0.12376960515975952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,8,power_law_1.01,1.1101375579833985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,4,power_law_1.01,0.084307199716568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,8,power_law_1.2,0.1327936053276062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,8,power_law_1.01,1.6076032638549804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,4,power_law_1.01,0.08757759928703308
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,8,power_law_1.2,0.1522495985031128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,4,power_law_1.01,0.09617919921875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,8,power_law_1.01,2.0292863845825195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,8,power_law_1.2,0.17907840013504028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,4,power_law_1.01,0.1084671974182129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,8,power_law_1.01,3.4380992889404296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,8,power_law_1.2,0.18992639780044557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,4,power_law_1.01,0.11297279596328735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,8,power_law_1.01,4.306470489501953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,8,power_law_1.2,0.14527360200881959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,8,power_law_1.2,0.18993279933929444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,8,power_law_1.01,5.677388763427734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,8,power_law_1.2,0.18993279933929444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,8,power_law_1.01,9.17496337890625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,8,power_law_1.2,0.24461441040039061
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,8,power_law_1.2,0.2986687898635864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,8,power_law_1.01,20.859437561035158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,8,power_law_1.2,0.3461951971054077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,8,power_law_1.2,0.4383552074432373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,8,power_law_1.2,0.5755648136138916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,8,power_law_1.2,0.8300607681274415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,8,power_law_1.2,1.0642239570617675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,4,power_law_1.2,0.07095040082931518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,8,power_law_1.2,1.4435135841369628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,4,power_law_1.2,0.09041280150413514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,4,power_law_1.2,0.09841279983520508
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,8,power_law_1.2,1.8852672576904297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,4,power_law_1.2,0.08324480056762695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,8,power_law_1.2,3.2025279998779297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,4,power_law_1.2,0.08365439772605895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,8,power_law_1.2,4.5134529113769535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,4,power_law_1.2,0.08734080195426941
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,4,power_law_1.2,0.09919360280036926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,8,power_law_1.2,5.503865432739258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,4,power_law_1.2,0.09429759979248047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,8,power_law_1.2,8.187379455566406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,4,power_law_1.2,0.10534399747848511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,4,power_law_1.2,0.11354880332946778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,8,power_law_1.2,20.056434631347656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,4,power_law_1.2,0.12544000148773193
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,4,power_law_1.2,0.13276159763336182
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,4,power_law_1.2,0.15205760002136232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,4,power_law_1.2,0.12174719572067261
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,4,power_law_1.2,0.13915519714355468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,4,power_law_1.2,0.1561535954475403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,4,power_law_1.2,0.17818880081176758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,4,power_law_1.2,0.2519999980926514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,4,power_law_1.2,0.23602559566497802
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,4,power_law_1.2,0.3150719881057739
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,4,power_law_1.2,0.40928001403808595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,4,power_law_1.2,0.6523839950561523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,4,power_law_1.2,0.8580032348632812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,4,power_law_1.2,1.3706111907958984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,4,power_law_1.2,1.3517760276794433
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,4,power_law_1.2,2.1080959320068358
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,4,power_law_1.2,3.5861438751220702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,4,power_law_1.2,3.8789886474609374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,4,power_law_1.2,8.936345672607422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,4,power_law_1.2,17.2876220703125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,2,power_law_1.01,0.058905601501464844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,2,power_law_1.01,0.060147202014923094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,2,power_law_1.01,0.0716159999370575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,2,power_law_1.01,0.08082559704780579
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,2,power_law_1.01,0.0806335985660553
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,2,power_law_1.01,0.08594560027122497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,2,power_law_1.01,0.09086719751358033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,2,power_law_1.01,0.09452800154685974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,2,power_law_1.01,0.09576320052146911
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,2,power_law_1.01,0.11175680160522461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,2,power_law_1.01,0.09618560075759888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,2,power_law_1.01,0.09905279874801635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,2,power_law_1.01,0.10397440195083618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,2,power_law_1.01,0.1043776035308838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,2,power_law_1.01,0.11503360271453858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,2,power_law_1.01,0.12034560441970825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,2,power_law_1.2,0.05800960063934326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,2,power_law_1.01,0.1297600030899048
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,2,power_law_1.01,0.15742080211639403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,2,power_law_1.2,0.06295679807662964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,2,power_law_1.01,0.1908031940460205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,2,power_law_1.2,0.06767359972000123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,2,power_law_1.01,0.24568960666656495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,2,power_law_1.2,0.08528640270233154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,2,power_law_1.01,0.3122368097305298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,2,power_law_1.2,0.08446720242500305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,2,power_law_1.2,0.08855680227279664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,2,power_law_1.01,0.3874176025390625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,2,power_law_1.2,0.09203839898109437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,2,power_law_1.01,0.5129536151885986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,2,power_law_1.2,0.10064640045166015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,2,power_law_1.01,0.6810688018798828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,2,power_law_1.2,0.1028864026069641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,2,power_law_1.01,1.0443840026855469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,2,power_law_1.2,0.1055616021156311
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,2,power_law_1.01,1.5453503608703614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,2,power_law_1.2,0.09388800263404846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,2,power_law_1.01,1.9268863677978516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,2,power_law_1.2,0.10043519735336304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,2,power_law_1.01,2.2795455932617186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,2,power_law_1.2,0.10903040170669556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,2,power_law_1.01,4.087731170654297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,2,power_law_1.2,0.10903040170669556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,2,power_law_1.2,0.11845760345458985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,2,power_law_1.01,8.19130859375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,2,power_law_1.2,0.12255359888076782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,2,power_law_1.2,0.14016640186309814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,2,power_law_1.2,0.1573632001876831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,2,power_law_1.2,0.17456640005111695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,2,power_law_1.2,0.2550528049468994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,1,power_law_1.01,0.05006719827651977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,2,power_law_1.2,0.3052160024642944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,1,power_law_1.01,0.05619199872016907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,2,power_law_1.2,0.446943998336792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,1,power_law_1.01,0.060915201902389526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,1,power_law_1.01,0.07771520018577575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,2,power_law_1.2,0.5268223762512207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,1,power_law_1.01,0.08324480056762695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,2,power_law_1.2,0.720358419418335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,1,power_law_1.01,0.0815999984741211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,2,power_law_1.2,0.9182080268859864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,1,power_law_1.01,0.08365439772605895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,2,power_law_1.2,1.452121639251709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,1,power_law_1.01,0.09264000058174134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,2,power_law_1.2,1.8057920455932617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,1,power_law_1.01,0.09552639722824097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,2,power_law_1.2,2.6872512817382814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,1,power_law_1.01,0.10126719474792481
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,2,power_law_1.2,4.199923324584961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,1,power_law_1.01,0.09102079868316651
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,1,power_law_1.01,0.09512320160865784
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,2,power_law_1.2,9.491500854492188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,1,power_law_1.01,0.09511680006980897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,1,power_law_1.01,0.10536320209503174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,1,power_law_1.01,0.11724159717559815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,4,power_law_1.01,0.12851840257644653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,1,power_law_1.01,0.11764479875564575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,1,power_law_1.01,0.1250048041343689
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,4,power_law_1.01,0.10682879686355591
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,1,power_law_1.01,0.1477504014968872
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,4,power_law_1.01,0.1137984037399292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,1,power_law_1.01,0.15901440382003784
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,4,power_law_1.01,0.11786880493164062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,1,power_law_1.01,0.20202240943908692
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,4,power_law_1.01,0.12437759637832642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,1,power_law_1.01,0.23764479160308838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,4,power_law_1.01,0.13941119909286498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,1,power_law_1.01,0.31341440677642823
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,4,power_law_1.01,0.15107200145721436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,1,power_law_1.01,0.3814336061477661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,4,power_law_1.01,0.17278720140457154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,4,power_law_1.01,0.19530880451202393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,1,power_law_1.01,0.5501696109771729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,4,power_law_1.01,0.2403712034225464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,1,power_law_1.01,0.7047999858856201
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,4,power_law_1.01,0.304256010055542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,1,power_law_1.01,1.030419158935547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,4,power_law_1.01,0.4433152198791504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,1,power_law_1.01,1.3607680320739746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,4,power_law_1.01,0.4814144134521484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,1,power_law_1.01,1.7042367935180665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,4,power_law_1.01,0.738431978225708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,1,power_law_1.01,2.7738880157470702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,4,power_law_1.01,1.060582447052002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,1,power_law_1.01,5.709292984008789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,4,power_law_1.01,1.4785216331481934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,4,power_law_1.01,1.8828544616699219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,4,power_law_1.01,2.4382144927978517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,4,power_law_1.01,3.719308853149414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,4,power_law_1.01,5.735903930664063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,4,power_law_1.01,14.65801544189453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,1,power_law_1.2,0.048467200994491574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,1,power_law_1.2,0.0581055998802185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,1,power_law_1.2,0.05809280276298523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,1,power_law_1.2,0.07713279724121094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,1,power_law_1.2,0.07980800271034241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,1,power_law_1.2,0.0859391987323761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,1,power_law_1.2,0.08799359798431397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,1,power_law_1.2,0.09086719751358033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,1,power_law_1.2,0.0986624002456665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,1,power_law_1.2,0.10417920351028442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,1,power_law_1.2,0.0933247983455658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,1,power_law_1.2,0.09618560075759888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,1,power_law_1.2,0.09945600032806397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,1,power_law_1.2,0.10560640096664428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,1,power_law_1.2,0.11809920072555542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,1,power_law_1.2,0.11830400228500366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,1,power_law_1.2,0.1240447998046875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,1,power_law_1.2,0.14902399778366088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,1,power_law_1.2,0.15825920104980468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,1,power_law_1.2,0.20027520656585693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,1,power_law_1.2,0.23252480030059813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,1,power_law_1.2,0.31122560501098634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,1,power_law_1.2,0.37102720737457273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,1,power_law_1.2,0.536300802230835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,1,power_law_1.2,0.6880576133728027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,1,power_law_1.2,1.015321636199951
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,1,power_law_1.2,1.3550911903381349
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,1,power_law_1.2,1.7046911239624023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,1,power_law_1.2,2.789504051208496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,1,power_law_1.2,5.67841911315918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,8,power_law_1.01,0.12787840366363526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,8,power_law_1.01,0.14384640455245973
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,8,power_law_1.01,0.1286911964416504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,8,power_law_1.01,0.12992639541625978
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,8,power_law_1.01,0.12993279695510865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,8,power_law_1.01,0.13565440177917482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,8,power_law_1.01,0.15941120386123658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,8,power_law_1.01,0.1463039994239807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,8,power_law_1.01,0.19095040559768678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,8,power_law_1.01,0.19383039474487304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,8,power_law_1.01,0.16883840560913085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,8,power_law_1.01,0.17436800003051758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,8,power_law_1.01,0.1907520055770874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,8,power_law_1.01,0.222707200050354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,8,power_law_1.01,0.2679680109024048
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,8,power_law_1.01,0.2660928010940552
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,8,power_law_1.01,0.37405440807342527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,8,power_law_1.01,0.4989759922027588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,8,power_law_1.01,0.49200639724731443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,8,power_law_1.01,0.6732607841491699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,8,power_law_1.01,0.8227711677551269
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,8,power_law_1.01,1.1354944229125976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,8,power_law_1.2,0.12195199728012085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,8,power_law_1.01,1.3217920303344726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,8,power_law_1.2,0.14079999923706055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,8,power_law_1.01,2.2459007263183595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,8,power_law_1.2,0.12337919473648071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,8,power_law_1.01,3.2430782318115234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,8,power_law_1.2,0.12502399682998658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,4,power_law_1.01,0.10848640203475952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,8,power_law_1.01,4.9879615783691404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,8,power_law_1.2,0.1227455973625183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,4,power_law_1.01,0.12095359563827515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,8,power_law_1.2,0.13526400327682495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,8,power_law_1.01,7.016121673583984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,4,power_law_1.01,0.12097920179367065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,8,power_law_1.2,0.14488320350646972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,4,power_law_1.01,0.1133952021598816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,8,power_law_1.01,8.867526245117187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,8,power_law_1.2,0.1471168041229248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,4,power_law_1.01,0.12035200595855713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,8,power_law_1.2,0.15943039655685426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,4,power_law_1.01,0.12833919525146484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,8,power_law_1.01,18.50030059814453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,8,power_law_1.2,0.20940160751342773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,4,power_law_1.01,0.1338688015937805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,8,power_law_1.2,0.2403264045715332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,4,power_law_1.01,0.14287359714508058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,8,power_law_1.2,0.3007424116134644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,8,power_law_1.01,38.67061157226563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,4,power_law_1.01,0.15045759677886963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,8,power_law_1.2,0.2968319892883301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,4,power_law_1.01,0.15189119577407836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,8,power_law_1.2,0.22148480415344238
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,4,power_law_1.01,0.13879679441452025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,8,power_law_1.2,0.25137920379638673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,4,power_law_1.01,0.1551743984222412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,8,power_law_1.2,0.289247989654541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,4,power_law_1.01,0.16439679861068726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,8,power_law_1.2,0.3400511980056763
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,4,power_law_1.01,0.1785024046897888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,8,power_law_1.2,0.4825920104980469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,4,power_law_1.01,0.1906048059463501
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,8,power_law_1.2,0.4838143825531006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,4,power_law_1.01,0.21580159664154053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,8,power_law_1.2,0.6671103954315185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,4,power_law_1.01,0.23955199718475342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,8,power_law_1.2,0.8887040138244628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,4,power_law_1.01,0.3022144079208374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,8,power_law_1.2,1.1523008346557617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,4,power_law_1.01,0.4001023769378662
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,8,power_law_1.2,1.6304319381713868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,4,power_law_1.01,0.5260608196258545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,8,power_law_1.2,2.4931007385253907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,4,power_law_1.01,0.6243711948394776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,8,power_law_1.2,3.741779327392578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,4,power_law_1.01,1.014521598815918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,8,power_law_1.2,5.694131088256836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,4,power_law_1.01,1.4001407623291016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,8,power_law_1.2,7.715737915039062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,4,power_law_1.01,1.5396096229553222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,4,power_law_1.01,2.37642879486084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,8,power_law_1.2,9.608857727050781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,4,power_law_1.01,3.5960128784179686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,8,power_law_1.2,20.320140075683593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,4,power_law_1.01,5.441664123535157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,4,power_law_1.01,6.4316162109375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,8,power_law_1.2,43.490386962890625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,4,power_law_1.01,10.206893157958984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,4,power_law_1.01,27.2962890625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,4,power_law_1.2,0.14369280338287355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,4,power_law_1.2,0.12239999771118164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,4,power_law_1.2,0.13345919847488402
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,4,power_law_1.2,0.12158080339431762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,4,power_law_1.2,0.1211840033531189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,4,power_law_1.2,0.1265023946762085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,4,power_law_1.2,0.13755520582199096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,4,power_law_1.2,0.14534399509429932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,4,power_law_1.2,0.18506879806518556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,4,power_law_1.2,0.18958719968795776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,4,power_law_1.2,0.1379647970199585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,4,power_law_1.2,0.1543552041053772
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,4,power_law_1.2,0.15947519540786742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,4,power_law_1.2,0.1746240019798279
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,4,power_law_1.2,0.20146560668945312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,4,power_law_1.2,0.2178368091583252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,4,power_law_1.2,0.24405760765075685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,4,power_law_1.2,0.3493184089660645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,4,power_law_1.2,0.3896703958511353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,4,power_law_1.2,0.4650303840637207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,4,power_law_1.2,0.59651198387146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,4,power_law_1.2,1.1334976196289062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,4,power_law_1.2,1.5109503746032715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,4,power_law_1.2,2.090732765197754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,4,power_law_1.2,2.2639936447143554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,4,power_law_1.2,3.4983230590820313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,4,power_law_1.2,4.909804916381836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,4,power_law_1.2,5.473004913330078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,4,power_law_1.2,12.951225280761719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,4,power_law_1.2,31.928671264648436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,2,power_law_1.01,0.09100800156593322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,2,power_law_1.01,0.0815936028957367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,2,power_law_1.01,0.08569599986076355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,2,power_law_1.01,0.1260159969329834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,2,power_law_1.01,0.12583680152893068
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,2,power_law_1.01,0.1260480046272278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,2,power_law_1.01,0.1446720004081726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,2,power_law_1.01,0.12992000579833984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,2,power_law_1.01,0.1340224027633667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,2,power_law_1.01,0.13893760442733766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,2,power_law_1.01,0.13973759412765502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,2,power_law_1.01,0.14118399620056152
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,2,power_law_1.01,0.1415168046951294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,2,power_law_1.01,0.15143040418624878
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,2,power_law_1.01,0.16679680347442627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,2,power_law_1.01,0.17251839637756347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,2,power_law_1.01,0.1844032049179077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,2,power_law_1.01,0.22106239795684815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,2,power_law_1.01,0.258950400352478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,2,power_law_1.01,0.3486527919769287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,2,power_law_1.01,0.41603841781616213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,2,power_law_1.01,0.6050623893737793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,2,power_law_1.01,0.7457600116729737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,2,power_law_1.01,1.1842368125915528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,2,power_law_1.01,1.332921600341797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,2,power_law_1.01,2.0931264877319338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,2,power_law_1.2,0.091212797164917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,2,power_law_1.01,3.1494848251342775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,2,power_law_1.2,0.08403199911117554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,2,power_law_1.01,4.125772857666016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,1,power_law_1.01,0.05727360248565674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,2,power_law_1.2,0.0953279972076416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,1,power_law_1.01,0.07242879867553711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,2,power_law_1.2,0.12338559627532959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,2,power_law_1.01,7.649158477783203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,1,power_law_1.01,0.08246399760246277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,2,power_law_1.2,0.1192896008491516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,1,power_law_1.01,0.1181056022644043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,2,power_law_1.01,14.850553894042969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,2,power_law_1.2,0.12625279426574706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,1,power_law_1.01,0.1215872049331665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,2,power_law_1.2,0.14713599681854247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,1,power_law_1.01,0.1240447998046875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,2,power_law_1.2,0.13485440015792846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,1,power_law_1.01,0.12670719623565674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,2,power_law_1.2,0.13813120126724243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,2,power_law_1.2,0.14010239839553834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,1,power_law_1.01,0.12774399518966675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,2,power_law_1.2,0.141593599319458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,1,power_law_1.01,0.1312000036239624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,2,power_law_1.2,0.1438591957092285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,1,power_law_1.01,0.13489279747009278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,2,power_law_1.2,0.14304640293121337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,1,power_law_1.01,0.12813440561294556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,2,power_law_1.2,0.15656319856643677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,1,power_law_1.01,0.1379583954811096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,2,power_law_1.2,0.16904959678649903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,1,power_law_1.01,0.1381824016571045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,2,power_law_1.2,0.17683839797973633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,1,power_law_1.01,0.1445248007774353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,2,power_law_1.2,0.1880895972251892
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,1,power_law_1.01,0.16213120222091676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,2,power_law_1.2,0.24707839488983155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,1,power_law_1.01,0.16213120222091676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,2,power_law_1.2,0.2659199953079224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,1,power_law_1.01,0.17052160501480101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,2,power_law_1.2,0.3814336061477661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,1,power_law_1.01,0.2055488109588623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,2,power_law_1.2,0.4830143928527832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,1,power_law_1.01,0.23340160846710206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,2,power_law_1.2,0.5792704105377198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,1,power_law_1.01,0.2923775911331177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,2,power_law_1.2,0.7891839981079102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,1,power_law_1.01,0.35136001110076903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,2,power_law_1.2,1.1752256393432616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,1,power_law_1.01,0.4715904235839844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,2,power_law_1.2,1.4500736236572265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,1,power_law_1.01,0.5883200168609619
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,1,power_law_1.01,0.8404352188110351
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,2,power_law_1.2,2.210291290283203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,1,power_law_1.01,1.0863871574401855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,2,power_law_1.2,3.440447998046875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,1,power_law_1.01,1.6268672943115234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,2,power_law_1.2,4.655590438842774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,1,power_law_1.01,2.162816047668457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,2,power_law_1.2,6.5149696350097654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,1,power_law_1.01,2.7366655349731444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,2,power_law_1.2,16.81481018066406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,1,power_law_1.01,4.468851089477539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,1,power_law_1.01,11.670540618896485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,1,power_law_1.2,0.05727999806404114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,1,power_law_1.2,0.07488639950752259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,1,power_law_1.2,0.07530879974365234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,1,power_law_1.2,0.11666560173034668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,1,power_law_1.2,0.12239359617233277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,1,power_law_1.2,0.12443519830703735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,1,power_law_1.2,0.13304959535598754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,1,power_law_1.2,0.12732160091400146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,1,power_law_1.2,0.12732160091400146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,1,power_law_1.2,0.1292736053466797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,1,power_law_1.2,0.13100800514221192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,1,power_law_1.2,0.13755520582199096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,1,power_law_1.2,0.13919999599456787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,1,power_law_1.2,0.14690560102462769
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,1,power_law_1.2,0.1603008031845093
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,1,power_law_1.2,0.16089600324630737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,1,power_law_1.2,0.17139840126037598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,1,power_law_1.2,0.2010432004928589
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,1,power_law_1.2,0.2311487913131714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,1,power_law_1.2,0.2972991943359375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,1,power_law_1.2,0.3492480039596558
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,1,power_law_1.2,0.47731838226318357
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,1,power_law_1.2,0.5735743999481201
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,1,power_law_1.2,0.812172794342041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,1,power_law_1.2,1.0584704399108886
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,1,power_law_1.2,1.5785280227661134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,1,power_law_1.2,2.202560043334961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,1,power_law_1.2,2.6910144805908205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,1,power_law_1.2,4.373222351074219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,1,power_law_1.2,11.506553649902344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,8,power_law_1.01,0.17907840013504028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,8,power_law_1.01,0.2800447940826416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,8,power_law_1.01,0.13075200319290162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,8,power_law_1.01,0.16139520406723024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,8,power_law_1.01,0.21492478847503663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,8,power_law_1.01,0.2661247968673706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,8,power_law_1.01,0.3420991897583008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,8,power_law_1.01,0.373638391494751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,8,power_law_1.01,0.37752320766448977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,8,power_law_1.01,0.38531200885772704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,8,power_law_1.01,0.38429439067840576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,8,power_law_1.01,0.4053760051727295
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,8,power_law_1.01,0.4019008159637451
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,8,power_law_1.01,0.43507838249206543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,8,power_law_1.01,0.43425917625427246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,8,power_law_1.01,0.41541762351989747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,8,power_law_1.01,0.44245758056640627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,8,power_law_1.01,0.4703104019165039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,8,power_law_1.01,0.5235328197479248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,8,power_law_1.01,0.5980800151824951
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,8,power_law_1.01,0.6054719924926758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,8,power_law_1.01,0.6949632167816162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,8,power_law_1.2,0.16516480445861817
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,8,power_law_1.01,0.8264512062072754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,8,power_law_1.2,0.24133760929107667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,8,power_law_1.01,1.0345151901245118
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,8,power_law_1.2,0.11294080018997192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,8,power_law_1.01,1.344377613067627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,4,power_law_1.01,0.10970879793167114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,8,power_law_1.2,0.13935999870300292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,8,power_law_1.01,1.919046401977539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,4,power_law_1.01,0.1647871971130371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,8,power_law_1.2,0.19791359901428224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,8,power_law_1.01,2.3032575607299806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,4,power_law_1.01,0.11717760562896729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,8,power_law_1.2,0.24714241027832032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,4,power_law_1.01,0.1359295964241028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,8,power_law_1.2,0.31916160583496095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,8,power_law_1.01,2.711840057373047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,4,power_law_1.01,0.19756799936294556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,8,power_law_1.2,0.36584959030151365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,8,power_law_1.01,3.9998207092285156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,4,power_law_1.01,0.24508800506591796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,8,power_law_1.2,0.3840831995010376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,4,power_law_1.01,0.33826560974121095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,8,power_law_1.2,0.3892159938812256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,8,power_law_1.01,10.573843383789063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,4,power_law_1.01,0.35669119358062745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,8,power_law_1.2,0.38161919116973875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,8,power_law_1.2,0.39001600742340087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,4,power_law_1.01,0.3562688112258911
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,8,power_law_1.2,0.41911678314208983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,4,power_law_1.01,0.37880959510803225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,8,power_law_1.2,0.4174784183502197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,4,power_law_1.01,0.4025792121887207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,8,power_law_1.2,0.42853760719299316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,4,power_law_1.01,0.39355518817901614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,8,power_law_1.2,0.45925121307373046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,4,power_law_1.01,0.41730561256408694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,8,power_law_1.2,0.47480320930480957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,4,power_law_1.01,0.4230527877807617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,8,power_law_1.2,0.5194687843322754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,4,power_law_1.01,0.4261184215545654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,8,power_law_1.2,0.5632959842681885
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,4,power_law_1.01,0.4359488010406494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,8,power_law_1.2,0.6222527980804443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,4,power_law_1.01,0.4498879909515381
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,8,power_law_1.2,0.6560704231262207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,4,power_law_1.01,0.4887104034423828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,8,power_law_1.2,0.8309503555297851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,4,power_law_1.01,0.5137728214263916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,8,power_law_1.2,0.9243712425231934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,4,power_law_1.01,0.5887360095977783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,4,power_law_1.01,0.5985536098480224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,8,power_law_1.2,1.2366592407226562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,4,power_law_1.01,0.7355648040771484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,8,power_law_1.2,1.5763263702392578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,4,power_law_1.01,0.844320011138916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,8,power_law_1.2,2.172127914428711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,4,power_law_1.01,1.059763240814209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,8,power_law_1.2,2.936908721923828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,4,power_law_1.01,1.3141375541687013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,8,power_law_1.2,3.4789569854736326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,4,power_law_1.01,1.8312448501586913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,8,power_law_1.2,6.4023490905761715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,4,power_law_1.01,2.175923156738281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,4,power_law_1.01,2.7452735900878906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,8,power_law_1.2,14.289170837402343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,4,power_law_1.01,4.719551849365234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,4,power_law_1.01,9.160633850097657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,4,power_law_1.2,0.10969599485397338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,4,power_law_1.2,0.1635648012161255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,4,power_law_1.2,0.0945472002029419
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,4,power_law_1.2,0.14451839923858642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,4,power_law_1.2,0.20757761001586914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,4,power_law_1.2,0.2417855978012085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,4,power_law_1.2,0.3417407989501953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,4,power_law_1.2,0.3464576005935669
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,4,power_law_1.2,0.3650880098342896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,4,power_law_1.2,0.3806591987609863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,4,power_law_1.2,0.3871999979019165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,4,power_law_1.2,0.41111040115356445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,4,power_law_1.2,0.3996095895767212
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,4,power_law_1.2,0.42052478790283204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,4,power_law_1.2,0.4482431888580322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,4,power_law_1.2,0.44086399078369143
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,4,power_law_1.2,0.48919677734375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,4,power_law_1.2,0.5182079792022705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,4,power_law_1.2,0.5657983779907226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,4,power_law_1.2,0.6638976097106933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,4,power_law_1.2,0.649894380569458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,4,power_law_1.2,0.7638207912445069
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,4,power_law_1.2,0.947321605682373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,4,power_law_1.2,1.1548095703125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,4,power_law_1.2,1.521183967590332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,4,power_law_1.2,1.928121566772461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,4,power_law_1.2,2.549139213562012
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,4,power_law_1.2,3.3000766754150392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,4,power_law_1.2,5.543654251098633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,4,power_law_1.2,12.152499389648437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,2,power_law_1.01,0.08609920144081115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,2,power_law_1.01,0.11436159610748291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,2,power_law_1.01,0.09716479778289795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,2,power_law_1.01,0.13933440446853637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,2,power_law_1.01,0.20325119495391847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,2,power_law_1.01,0.2585279941558838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,2,power_law_1.01,0.3390271902084351
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,2,power_law_1.01,0.36810879707336425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,2,power_law_1.01,0.37118079662323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,2,power_law_1.01,0.3865472078323364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,2,power_law_1.01,0.4068096160888672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,2,power_law_1.01,0.4107200145721436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,2,power_law_1.01,0.40414719581604003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,2,power_law_1.01,0.42731518745422364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,2,power_law_1.01,0.43425917625427246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,2,power_law_1.01,0.4649792194366455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,2,power_law_1.01,0.4776768207550049
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,2,power_law_1.01,0.5104383945465087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,2,power_law_1.01,0.5504576206207276
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,2,power_law_1.01,0.6383935928344726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,2,power_law_1.01,0.6839104175567627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,2,power_law_1.01,0.8051199913024902
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,2,power_law_1.01,0.9661248207092286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,2,power_law_1.01,1.1539263725280762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,2,power_law_1.2,0.0881600022315979
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,2,power_law_1.01,1.4308159828186036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,2,power_law_1.2,0.11396479606628418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,2,power_law_1.01,1.946905517578125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,2,power_law_1.2,0.09389439821243287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,2,power_law_1.01,2.493926429748535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,2,power_law_1.2,0.13854080438613892
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,2,power_law_1.01,3.140070343017578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,2,power_law_1.2,0.17273600101470948
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,2,power_law_1.2,0.2290560007095337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,2,power_law_1.01,4.655123138427735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,2,power_law_1.2,0.3175296068191528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,2,power_law_1.2,0.3613440036773682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,2,power_law_1.01,10.363302612304688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,2,power_law_1.2,0.3513279914855957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,2,power_law_1.2,0.38430080413818357
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,2,power_law_1.2,0.4000703811645508
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,2,power_law_1.2,0.4039616107940674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,2,power_law_1.2,0.4219776153564453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,2,power_law_1.2,0.44492158889770506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,2,power_law_1.2,0.4567872047424316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,1,power_law_1.01,0.06792320013046264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,2,power_law_1.2,0.4772799968719482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,1,power_law_1.01,0.09088640213012696
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,2,power_law_1.2,0.5292863845825195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,1,power_law_1.01,0.10131200551986694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,2,power_law_1.2,0.5718848228454589
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,1,power_law_1.01,0.1486143946647644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,2,power_law_1.2,0.581715202331543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,1,power_law_1.01,0.22009599208831787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,2,power_law_1.2,0.6523647785186768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,1,power_law_1.01,0.27682559490203856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,2,power_law_1.2,0.6916863918304443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,1,power_law_1.01,0.3726720094680786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,2,power_law_1.2,0.8629119873046875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,1,power_law_1.01,0.3900736093521118
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,2,power_law_1.2,0.956287956237793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,1,power_law_1.01,0.4107647895812988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,2,power_law_1.2,1.2624832153320313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,1,power_law_1.01,0.41547517776489257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,1,power_law_1.01,0.4330944061279297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,2,power_law_1.2,1.5256383895874024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,1,power_law_1.01,0.4564352035522461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,2,power_law_1.2,2.1134975433349608
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,1,power_law_1.01,0.4670720100402832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,2,power_law_1.2,2.803385543823242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,1,power_law_1.01,0.4826367855072021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,2,power_law_1.2,3.412255859375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,1,power_law_1.01,0.49125118255615235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,1,power_law_1.01,0.5092735767364502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,2,power_law_1.2,5.4805248260498045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,1,power_law_1.01,0.5428415775299072
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,1,power_law_1.01,0.6145472049713134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,2,power_law_1.2,11.363609313964844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,1,power_law_1.01,0.6879936218261719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,1,power_law_1.01,0.7772928237915039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,1,power_law_1.01,0.8772416114807129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,1,power_law_1.01,1.0573056221008301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,1,power_law_1.01,1.2756352424621582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,1,power_law_1.01,1.632601547241211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,1,power_law_1.01,1.9821887969970704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,1,power_law_1.01,2.7276607513427735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,1,power_law_1.01,3.456959915161133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,8,power_law_1.01,0.09237120151519776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,8,power_law_1.01,0.07114880084991455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,1,power_law_1.01,4.211820983886719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,8,power_law_1.01,0.06234239935874939
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,1,power_law_1.01,6.631334686279297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,8,power_law_1.01,0.06766719818115234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,8,power_law_1.01,0.08483840227127075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,8,power_law_1.01,0.11599999666213989
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,1,power_law_1.01,12.994291687011719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,8,power_law_1.01,0.11763839721679688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,8,power_law_1.01,0.11968640089035035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,8,power_law_1.01,0.12255359888076782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,8,power_law_1.01,0.12378879785537719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,8,power_law_1.01,0.1258239984512329
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,8,power_law_1.01,0.12583039999008178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,8,power_law_1.01,0.13073920011520385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,8,power_law_1.01,0.13299839496612548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,1,power_law_1.2,0.07120000123977661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,8,power_law_1.01,0.14303359985351563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,8,power_law_1.01,0.14998400211334229
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,1,power_law_1.2,0.09086080193519593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,8,power_law_1.01,0.15266560316085814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,1,power_law_1.2,0.09700480103492737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,8,power_law_1.01,0.17128959894180298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,1,power_law_1.2,0.1418496012687683
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,8,power_law_1.01,0.18113280534744264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,1,power_law_1.2,0.18786560297012328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,8,power_law_1.01,0.21819519996643066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,1,power_law_1.2,0.2520319938659668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,8,power_law_1.01,0.23683199882507325
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,1,power_law_1.2,0.35666561126708984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,8,power_law_1.01,0.29926400184631347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,1,power_law_1.2,0.3871999979019165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,8,power_law_1.01,0.3529536008834839
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,1,power_law_1.2,0.40051841735839844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,8,power_law_1.01,0.5108543872833252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,1,power_law_1.2,0.42653441429138184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,8,power_law_1.01,0.5890880107879639
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,1,power_law_1.2,0.43553919792175294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,8,power_law_1.01,0.7908031940460205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,1,power_law_1.2,0.4715775966644287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,8,power_law_1.2,0.091839998960495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,8,power_law_1.01,1.0262720108032226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,1,power_law_1.2,0.4654399871826172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,8,power_law_1.2,0.05294079780578613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,1,power_law_1.2,0.4969855785369873
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,8,power_law_1.01,1.3091584205627442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,8,power_law_1.2,0.059487998485565186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,1,power_law_1.2,0.5096767902374267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,8,power_law_1.01,2.3028543472290037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,8,power_law_1.2,0.0676800012588501
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,1,power_law_1.2,0.5305535793304443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,8,power_law_1.2,0.08117759823799134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,8,power_law_1.01,3.9432960510253907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,1,power_law_1.2,0.5653696060180664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,8,power_law_1.2,0.11314560174942016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,1,power_law_1.2,0.6300864219665527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,8,power_law_1.2,0.11765120029449463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,8,power_law_1.2,0.12091519832611083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,1,power_law_1.2,0.6843647956848145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,8,power_law_1.2,0.12379519939422608
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,1,power_law_1.2,0.7916736125946044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,8,power_law_1.2,0.12726399898529053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,1,power_law_1.2,0.9047231674194336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,8,power_law_1.2,0.131167995929718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,1,power_law_1.2,1.1166912078857423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,8,power_law_1.2,0.13055360317230225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,1,power_law_1.2,1.3178112030029296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,8,power_law_1.2,0.13893120288848876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,1,power_law_1.2,1.6682111740112304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,8,power_law_1.2,0.13772159814834595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,8,power_law_1.2,0.1498047947883606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,1,power_law_1.2,2.0169919967651366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,8,power_law_1.2,0.14856959581375123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,1,power_law_1.2,2.717011260986328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,4,power_law_1.01,0.058911997079849246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,8,power_law_1.2,0.1491968035697937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,4,power_law_1.01,0.04766719937324524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,1,power_law_1.2,3.428287887573242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,8,power_law_1.2,0.17744640111923218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,4,power_law_1.01,0.05441920161247253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,8,power_law_1.2,0.19218560457229614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,1,power_law_1.2,4.227820968627929
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,4,power_law_1.01,0.06158080101013184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,8,power_law_1.2,0.22822399139404298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,4,power_law_1.01,0.08267520070075988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,1,power_law_1.2,6.818937683105469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,8,power_law_1.2,0.2509567975997925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,4,power_law_1.01,0.11338239908218384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,8,power_law_1.2,0.3308480024337769
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,4,power_law_1.01,0.11851520538330078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,8,power_law_1.2,0.41933441162109375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,1,power_law_1.2,13.706573486328125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,4,power_law_1.01,0.1217919945716858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,8,power_law_1.2,0.602617597579956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,4,power_law_1.01,0.12282240390777588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,8,power_law_1.2,0.826476764678955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,4,power_law_1.01,0.12097280025482178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,8,power_law_1.2,1.106003189086914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,4,power_law_1.01,0.1281280040740967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,8,power_law_1.2,1.51211519241333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,4,power_law_1.01,0.12814079523086547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,8,power_law_1.2,1.6190080642700195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,4,power_law_1.01,0.13100160360336305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,4,power_law_1.01,0.1353279948234558
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,8,power_law_1.2,3.286092758178711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,4,power_law_1.01,0.14554879665374756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,4,power_law_1.01,0.1445248007774353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,8,power_law_1.2,8.52631072998047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,4,power_law_1.01,0.1559999942779541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,4,power_law_1.01,0.1654207944869995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,4,power_law_1.01,0.18421759605407714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,4,power_law_1.01,0.21702399253845214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,4,power_law_1.01,0.23955199718475342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,4,power_law_1.01,0.28971519470214846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,4,power_law_1.01,0.36161279678344727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,4,power_law_1.01,0.47241601943969724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,4,power_law_1.01,0.5510528087615967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,4,power_law_1.01,0.8445247650146485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,4,power_law_1.01,1.0308863639831543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,4,power_law_1.2,0.05906559824943543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,4,power_law_1.2,0.045952001214027406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,4,power_law_1.01,1.3690176010131836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,4,power_law_1.2,0.05661439895629883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,4,power_law_1.01,1.9506431579589845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,4,power_law_1.2,0.06480640172958374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,4,power_law_1.2,0.07382400035858154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,4,power_law_1.01,4.500812911987305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,4,power_law_1.2,0.11559040546417236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,4,power_law_1.2,0.12027519941329956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,4,power_law_1.2,0.12501120567321777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,4,power_law_1.2,0.12787840366363526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,4,power_law_1.2,0.12707200050354003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,4,power_law_1.2,0.1270591974258423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,4,power_law_1.2,0.13320319652557372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,4,power_law_1.2,0.13341439962387086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,4,power_law_1.2,0.14016640186309814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,4,power_law_1.2,0.14876799583435057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,4,power_law_1.2,0.15410560369491577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,4,power_law_1.2,0.15368319749832154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,4,power_law_1.2,0.17252479791641234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,4,power_law_1.2,0.18391679525375365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,4,power_law_1.2,0.22249600887298585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,4,power_law_1.2,0.2603840112686157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,4,power_law_1.2,0.3310400009155273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,4,power_law_1.2,0.3652415990829468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,2,power_law_1.01,0.04661760032176972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,4,power_law_1.2,0.4780928134918213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,2,power_law_1.01,0.043750399351119997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,4,power_law_1.2,0.6949696063995361
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,2,power_law_1.01,0.05072640180587769
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,4,power_law_1.2,0.9169728279113769
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,2,power_law_1.01,0.06362239718437195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,4,power_law_1.2,1.2473024368286132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,2,power_law_1.01,0.08634880185127258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,4,power_law_1.2,1.4189311981201171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,2,power_law_1.01,0.1162559986114502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,2,power_law_1.01,0.12649600505828856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,4,power_law_1.2,2.373523139953613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,2,power_law_1.01,0.12813440561294556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,2,power_law_1.01,0.12833919525146484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,4,power_law_1.2,4.814310455322266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,2,power_law_1.2,0.0480320006608963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,2,power_law_1.01,0.13100800514221192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,2,power_law_1.2,0.04268800020217896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,2,power_law_1.01,0.13182719945907592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,2,power_law_1.2,0.05006080269813538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,2,power_law_1.01,0.13426560163497925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,2,power_law_1.2,0.061536002159118655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,2,power_law_1.01,0.1410367965698242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,2,power_law_1.2,0.07299839854240417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,2,power_law_1.01,0.14614399671554565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,2,power_law_1.2,0.11519360542297363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,2,power_law_1.01,0.15701119899749755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,2,power_law_1.2,0.125382399559021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,2,power_law_1.01,0.16129920482635499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,2,power_law_1.2,0.12910079956054688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,2,power_law_1.01,0.163372802734375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,2,power_law_1.2,0.13095680475234986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,2,power_law_1.01,0.18547840118408204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,2,power_law_1.01,0.200217604637146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,2,power_law_1.2,0.13383040428161622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,2,power_law_1.01,0.2375040054321289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,2,power_law_1.2,0.13935999870300292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,2,power_law_1.2,0.1450943946838379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,2,power_law_1.01,0.2784575939178467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,2,power_law_1.2,0.1426367998123169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,2,power_law_1.01,0.3335488080978394
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,2,power_law_1.2,0.15287679433822632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,2,power_law_1.01,0.42099838256835936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,2,power_law_1.2,0.16229759454727172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,2,power_law_1.01,0.5764351844787597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,2,power_law_1.2,0.16944639682769774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,2,power_law_1.01,0.7142720222473145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,2,power_law_1.2,0.17211519479751586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,2,power_law_1.01,1.0521792411804198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,2,power_law_1.2,0.18545279502868653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,2,power_law_1.01,1.2543231964111328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,2,power_law_1.2,0.20981121063232422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,2,power_law_1.01,1.4957823753356934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,2,power_law_1.2,0.24563200473785402
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,2,power_law_1.2,0.28375680446624757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,2,power_law_1.01,2.6000640869140623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,2,power_law_1.2,0.337388801574707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,2,power_law_1.01,4.662195205688477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,2,power_law_1.2,0.43091840744018556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,1,power_law_1.01,0.038227200508117676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,2,power_law_1.2,0.5859903812408447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,1,power_law_1.01,0.0441536009311676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,2,power_law_1.2,0.6798208236694336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,1,power_law_1.01,0.05667200088500977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,2,power_law_1.2,1.0818495750427246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,1,power_law_1.01,0.07182719707489013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,2,power_law_1.2,1.3517631530761718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,1,power_law_1.01,0.08062080144882203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,2,power_law_1.2,1.8123519897460938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,1,power_law_1.01,0.1277184009552002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,2,power_law_1.2,2.713267135620117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,1,power_law_1.01,0.13408000469207765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,1,power_law_1.01,0.13694080114364623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,2,power_law_1.2,5.290060806274414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,1,power_law_1.01,0.14001920223236083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,1,power_law_1.01,0.14165120124816893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,1,power_law_1.01,0.14615679979324342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,1,power_law_1.01,0.15148799419403075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,1,power_law_1.01,0.15681920051574708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,1,power_law_1.01,0.16785279512405396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,1,power_law_1.01,0.17770880460739136
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,1,power_law_1.01,0.1875264048576355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,1,power_law_1.01,0.20698881149291992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,1,power_law_1.01,0.24384639263153077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,1,power_law_1.01,0.26905601024627684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,1,power_law_1.01,0.3296639919281006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,1,power_law_1.01,0.39745919704437255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,1,power_law_1.01,0.5072256088256836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,1,power_law_1.01,0.6100351810455322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,1,power_law_1.01,0.8211839675903321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,1,power_law_1.01,1.016160011291504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,1,power_law_1.01,1.4300543785095214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,1,power_law_1.2,0.03878400027751923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,1,power_law_1.01,1.8193792343139648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,1,power_law_1.2,0.0455487996339798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,1,power_law_1.01,2.2611200332641603
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,1,power_law_1.2,0.05618559718132019
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,1,power_law_1.01,3.4712894439697264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,1,power_law_1.2,0.06603519916534424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,1,power_law_1.2,0.07585920095443725
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,1,power_law_1.01,7.091129302978516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,1,power_law_1.2,0.12788480520248413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,1,power_law_1.2,0.13074560165405275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,1,power_law_1.2,0.14016000032424927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,1,power_law_1.2,0.14263039827346802
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,1,power_law_1.2,0.143449604511261
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,1,power_law_1.2,0.14754559993743896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,1,power_law_1.2,0.1545024037361145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,1,power_law_1.2,0.15859839916229249
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,1,power_law_1.2,0.16883840560913085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,1,power_law_1.2,0.18071039915084838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,1,power_law_1.2,0.18890880346298217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,1,power_law_1.2,0.20611200332641602
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,1,power_law_1.2,0.24296319484710693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,1,power_law_1.2,0.2741055965423584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,1,power_law_1.2,0.329804801940918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,1,power_law_1.2,0.4019008159637451
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,1,power_law_1.2,0.513318395614624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,1,power_law_1.2,0.6084095954895019
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,1,power_law_1.2,0.813753604888916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,1,power_law_1.2,1.0095487594604493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,1,power_law_1.2,1.4426943778991699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,1,power_law_1.2,1.8529087066650392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,1,power_law_1.2,2.295897674560547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,1,power_law_1.2,3.584864044189453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,1,power_law_1.2,7.2586112976074215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,8,power_law_1.01,0.20881919860839843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,8,power_law_1.01,0.2565311908721924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,8,power_law_1.01,0.11094399690628051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,8,power_law_1.01,0.16206079721450806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,8,power_law_1.01,0.19633280038833617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,8,power_law_1.01,0.27088000774383547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,8,power_law_1.01,0.2663615942001343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,8,power_law_1.01,0.28089599609375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,8,power_law_1.01,0.30487680435180664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,8,power_law_1.01,0.28739840984344484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,8,power_law_1.2,0.20774400234222412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,8,power_law_1.01,0.31675519943237307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,8,power_law_1.2,0.0969215989112854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,8,power_law_1.01,0.31880319118499756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,8,power_law_1.2,0.10454399585723877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,8,power_law_1.01,0.3110016107559204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,8,power_law_1.2,0.13894399404525756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,8,power_law_1.01,0.32614400386810305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,8,power_law_1.2,0.1966912031173706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,8,power_law_1.01,0.33805439472198484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,8,power_law_1.2,0.2788095951080322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,8,power_law_1.01,0.33886721134185793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,8,power_law_1.2,0.2896575927734375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,8,power_law_1.01,0.3792128086090088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,8,power_law_1.2,0.287225604057312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,8,power_law_1.01,0.41750397682189944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,8,power_law_1.2,0.301145601272583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,8,power_law_1.2,0.30517120361328126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,8,power_law_1.01,0.4736320018768311
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,8,power_law_1.2,0.3130239963531494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,8,power_law_1.01,0.6075712203979492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,8,power_law_1.2,0.3314624071121216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,8,power_law_1.01,0.5837503910064697
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,8,power_law_1.2,0.329203200340271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,8,power_law_1.01,0.7388224124908447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,8,power_law_1.2,0.3406719923019409
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,8,power_law_1.01,0.8133824348449707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,8,power_law_1.2,0.35112318992614744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,8,power_law_1.01,1.1748607635498047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,8,power_law_1.2,0.3476416110992432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,8,power_law_1.01,1.2551487922668456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,8,power_law_1.2,0.39044480323791503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,8,power_law_1.01,1.9572032928466796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,8,power_law_1.2,0.48178558349609374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,8,power_law_1.01,2.5160896301269533
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,8,power_law_1.2,0.5002048015594482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,8,power_law_1.01,3.6013248443603514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,8,power_law_1.2,0.631283187866211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,8,power_law_1.2,0.5894847869873047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,8,power_law_1.01,4.88152961730957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,8,power_law_1.2,0.740447998046875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,4,power_law_1.01,0.1174847960472107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,8,power_law_1.2,0.9386943817138672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,8,power_law_1.01,11.398489379882813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,4,power_law_1.01,0.13755520582199096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,8,power_law_1.2,1.2931839942932128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,4,power_law_1.01,0.10499839782714844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,8,power_law_1.2,1.637049674987793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,4,power_law_1.01,0.15434880256652833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,8,power_law_1.2,2.5647872924804687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,4,power_law_1.01,0.18753279447555543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,8,power_law_1.2,3.220556640625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,4,power_law_1.01,0.26004478931427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,8,power_law_1.2,4.493388748168945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,4,power_law_1.01,0.27232000827789304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,4,power_law_1.01,0.28723840713500975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,8,power_law_1.2,6.738617706298828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,4,power_law_1.01,0.29196159839630126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,4,power_law_1.01,0.2887104034423828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,8,power_law_1.2,17.538758850097658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,4,power_law_1.01,0.3071295976638794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,4,power_law_1.01,0.30877439975738524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,4,power_law_1.01,0.316979193687439
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,4,power_law_1.01,0.3247551918029785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,4,power_law_1.01,0.3337408065795898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,4,power_law_1.01,0.35703680515289304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,4,power_law_1.01,0.37246079444885255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,4,power_law_1.01,0.41546878814697263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,4,power_law_1.01,0.43021440505981445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,4,power_law_1.01,0.5391744136810303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,4,power_law_1.01,0.5952960014343261
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,4,power_law_1.01,0.7310656070709228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,4,power_law_1.01,0.7912896156311036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,4,power_law_1.01,1.0026368141174316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,4,power_law_1.2,0.11681920289993286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,4,power_law_1.01,1.3845184326171875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,4,power_law_1.2,0.08407040238380432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,4,power_law_1.01,1.9342464447021483
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,4,power_law_1.2,0.09182720184326172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,4,power_law_1.01,2.153011131286621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,4,power_law_1.2,0.1399616003036499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,4,power_law_1.01,2.6615167617797852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,4,power_law_1.2,0.17662080526351928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,4,power_law_1.2,0.26243200302124026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,4,power_law_1.01,4.911859130859375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,4,power_law_1.2,0.2890624046325684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,4,power_law_1.2,0.28638720512390137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,4,power_law_1.01,10.884646606445312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,4,power_law_1.2,0.2947904109954834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,4,power_law_1.2,0.296230411529541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,4,power_law_1.2,0.3146559953689575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,4,power_law_1.2,0.32407679557800295
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,4,power_law_1.2,0.32039039134979247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,4,power_law_1.2,0.31629440784454343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,4,power_law_1.2,0.34946560859680176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,4,power_law_1.2,0.34432640075683596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,4,power_law_1.2,0.3750783920288086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,4,power_law_1.2,0.4285247802734375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,4,power_law_1.2,0.45801601409912107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,4,power_law_1.2,0.5636928081512451
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,4,power_law_1.2,0.6230847835540771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,4,power_law_1.2,0.7580480098724365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,4,power_law_1.2,0.8354687690734863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,4,power_law_1.2,1.0867456436157226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,4,power_law_1.2,1.2723072052001954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,4,power_law_1.2,1.838982391357422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,4,power_law_1.2,2.769804763793945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,4,power_law_1.2,3.1023231506347657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,4,power_law_1.2,5.71905288696289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,4,power_law_1.2,13.452287292480468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,2,power_law_1.01,0.08759040236473084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,2,power_law_1.01,0.11011840105056762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,2,power_law_1.01,0.09393280148506164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,2,power_law_1.01,0.14001280069351196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,2,power_law_1.01,0.17441920042037964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,2,power_law_1.01,0.2637120008468628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,2,power_law_1.01,0.2770240068435669
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,2,power_law_1.01,0.2897279977798462
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,2,power_law_1.01,0.3026240110397339
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,2,power_law_1.01,0.3085504055023193
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,2,power_law_1.01,0.31040639877319337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,2,power_law_1.2,0.0902079999446869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,2,power_law_1.01,0.3185728073120117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,2,power_law_1.2,0.08182399868965148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,2,power_law_1.01,0.32330880165100095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,2,power_law_1.2,0.09471359848976135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,2,power_law_1.01,0.3367552042007446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,2,power_law_1.2,0.12870399951934813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,2,power_law_1.01,0.359552001953125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,2,power_law_1.2,0.1717120051383972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,2,power_law_1.01,0.36447360515594485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,2,power_law_1.2,0.2544384002685547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,2,power_law_1.01,0.378003191947937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,2,power_law_1.2,0.2683840036392212
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,2,power_law_1.01,0.42099199295043943
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,2,power_law_1.2,0.28843519687652586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,2,power_law_1.01,0.44822402000427247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,2,power_law_1.2,0.314246392250061
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,2,power_law_1.01,0.5465343952178955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,2,power_law_1.01,0.5948671817779541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,2,power_law_1.2,0.31958398818969724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,2,power_law_1.2,0.3251136064529419
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,2,power_law_1.01,0.729414415359497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,2,power_law_1.2,0.3275712013244629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,2,power_law_1.01,0.8206975936889649
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,2,power_law_1.2,0.340883207321167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,2,power_law_1.01,1.028428840637207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,2,power_law_1.2,0.35050880908966064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,2,power_law_1.01,1.2940608024597169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,2,power_law_1.2,0.36419200897216797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,2,power_law_1.01,1.9358911514282227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,2,power_law_1.2,0.3642175912857056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,2,power_law_1.01,2.2648128509521483
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,2,power_law_1.2,0.3824512004852295
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,2,power_law_1.01,2.849305534362793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,2,power_law_1.2,0.42792320251464844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,2,power_law_1.2,0.4723519802093506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,2,power_law_1.01,4.514854431152344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,2,power_law_1.2,0.5493696212768555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,2,power_law_1.2,0.5697663784027099
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,2,power_law_1.01,8.948242950439454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,2,power_law_1.2,0.7318143844604492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,2,power_law_1.2,0.8627840042114258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,2,power_law_1.2,1.1489472389221191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,2,power_law_1.2,1.3980416297912597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,2,power_law_1.2,2.152467155456543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,2,power_law_1.2,2.3340736389160157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,2,power_law_1.2,3.193881607055664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,2,power_law_1.2,5.70068473815918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,1,power_law_1.01,0.06383360028266907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,1,power_law_1.01,0.08268160223960877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,2,power_law_1.2,12.889369201660156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,1,power_law_1.01,0.09907839894294738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,1,power_law_1.01,0.14328960180282593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,1,power_law_1.01,0.18629759550094604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,1,power_law_1.01,0.2788671970367432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,1,power_law_1.01,0.3001728057861328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,1,power_law_1.01,0.3087807893753052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,1,power_law_1.01,0.3173696041107178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,1,power_law_1.01,0.32515840530395507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,1,power_law_1.01,0.3347775936126709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,1,power_law_1.01,0.3470720052719116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,1,power_law_1.01,0.35193600654602053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,1,power_law_1.01,0.37020800113677976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,1,power_law_1.01,0.3890496015548706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,1,power_law_1.01,0.4152575969696045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,1,power_law_1.01,0.4197696208953857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,1,power_law_1.01,0.4806015968322754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,1,power_law_1.01,0.5272704124450683
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,1,power_law_1.01,0.6219264030456543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,1,power_law_1.01,0.7134335994720459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,1,power_law_1.01,0.9035136222839355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,1,power_law_1.01,1.1568511962890624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,1,power_law_1.01,1.468556785583496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,1,power_law_1.01,1.7411455154418944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,1,power_law_1.01,2.408793640136719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,1,power_law_1.2,0.06438400149345398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,1,power_law_1.2,0.08446720242500305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,1,power_law_1.01,3.1302911758422853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,1,power_law_1.2,0.10146559476852417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,1,power_law_1.01,3.835628890991211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,1,power_law_1.2,0.13422080278396606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,1,power_law_1.01,5.896537780761719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,1,power_law_1.2,0.1778496026992798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,1,power_law_1.2,0.26857600212097166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,1,power_law_1.01,12.227110290527344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,1,power_law_1.2,0.30229759216308594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,1,power_law_1.2,0.3223488092422485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,1,power_law_1.2,0.32674560546875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,1,power_law_1.2,0.3382015943527222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,1,power_law_1.2,0.3533695936203003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,1,power_law_1.2,0.3654016017913818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,1,power_law_1.2,0.3715903997421265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,1,power_law_1.2,0.38305280208587644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,1,power_law_1.2,0.4023168087005615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,1,power_law_1.2,0.4154304027557373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,1,power_law_1.2,0.43466877937316895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,1,power_law_1.2,0.48504958152770994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,1,power_law_1.2,0.527238416671753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,1,power_law_1.2,0.6243135929107666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,1,power_law_1.2,0.7199615955352783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,1,power_law_1.2,0.9001855850219727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,1,power_law_1.2,1.159660816192627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,1,power_law_1.2,1.4780735969543457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,1,power_law_1.2,1.807846450805664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,1,power_law_1.2,2.4669055938720703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,1,power_law_1.2,3.193939208984375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,1,power_law_1.2,4.009523010253906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,1,power_law_1.2,6.11541748046875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,1,power_law_1.2,12.631065368652344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,8,power_law_1.01,0.16206079721450806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,8,power_law_1.01,0.26801280975341796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,8,power_law_1.01,0.48305277824401854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,8,power_law_1.01,0.15024640560150146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,8,power_law_1.01,0.21313281059265138
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,8,power_law_1.01,0.33315200805664064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,8,power_law_1.01,0.3824959993362427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,8,power_law_1.01,0.45274882316589354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,8,power_law_1.01,0.47110400199890134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,8,power_law_1.01,0.5051712036132813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,8,power_law_1.2,0.16725759506225585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,8,power_law_1.01,0.49042558670043945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,8,power_law_1.2,0.2759552001953125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,8,power_law_1.01,0.48142080307006835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,8,power_law_1.2,0.33330559730529785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,8,power_law_1.01,0.5334335803985596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,8,power_law_1.2,0.14960000514984131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,8,power_law_1.01,0.54202241897583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,8,power_law_1.2,0.222489595413208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,8,power_law_1.01,0.5428544044494629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,8,power_law_1.2,0.2708415985107422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,8,power_law_1.01,0.5653632164001465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,8,power_law_1.2,0.31466240882873536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,8,power_law_1.01,0.5879039764404297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,8,power_law_1.2,0.44737920761108396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,8,power_law_1.01,0.6190271854400635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,8,power_law_1.2,0.46985602378845215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,8,power_law_1.01,0.6573376178741455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,8,power_law_1.2,0.4797311782836914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,8,power_law_1.01,0.7318848133087158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,8,power_law_1.2,0.46581120491027833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,8,power_law_1.01,0.7810239791870117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,8,power_law_1.2,0.4981696128845215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,8,power_law_1.01,0.922764778137207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,8,power_law_1.2,0.509222412109375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,8,power_law_1.01,0.944057559967041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,8,power_law_1.2,0.5444543838500977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,8,power_law_1.2,0.5665728092193604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,8,power_law_1.01,1.228934383392334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,8,power_law_1.2,0.5751679897308349
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,8,power_law_1.01,1.5338687896728516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,8,power_law_1.2,0.5817215919494629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,8,power_law_1.01,1.932147216796875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,8,power_law_1.2,0.6384575843811036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,8,power_law_1.01,2.4464767456054686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,8,power_law_1.2,0.701535987854004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,8,power_law_1.01,2.9815999984741213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,8,power_law_1.2,0.803929615020752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,8,power_law_1.01,4.554886245727539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,8,power_law_1.2,0.9292736053466797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,8,power_law_1.2,1.1203519821166992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,8,power_law_1.01,10.62842254638672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,8,power_law_1.2,1.085536003112793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,8,power_law_1.2,1.3198016166687012
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,4,power_law_1.01,0.11052800416946411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,4,power_law_1.01,0.165830397605896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,8,power_law_1.2,1.6649023056030274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,4,power_law_1.01,0.26576640605926516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,8,power_law_1.2,2.432486343383789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,4,power_law_1.01,0.1443071961402893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,8,power_law_1.2,3.046681594848633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,4,power_law_1.01,0.2000256061553955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,8,power_law_1.2,3.7393089294433595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,4,power_law_1.01,0.30959999561309814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,4,power_law_1.01,0.345030403137207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,8,power_law_1.2,5.8903358459472654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,4,power_law_1.01,0.4326784133911133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,8,power_law_1.2,15.776454162597656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,4,power_law_1.01,0.44988160133361815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,4,power_law_1.01,0.4793600082397461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,4,power_law_1.01,0.4965375900268555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,4,power_law_1.01,0.5191103935241699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,4,power_law_1.01,0.5354879856109619
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,4,power_law_1.01,0.5551424026489258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,4,power_law_1.01,0.5797247886657715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,4,power_law_1.01,0.5739840030670166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,4,power_law_1.01,0.6005951881408691
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,4,power_law_1.01,0.6169792175292969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,4,power_law_1.01,0.6712768077850342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,4,power_law_1.01,0.7597375869750976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,4,power_law_1.01,0.79169921875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,4,power_law_1.01,0.9825663566589355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,4,power_law_1.2,0.11230720281600952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,4,power_law_1.01,1.0038592338562011
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,4,power_law_1.2,0.16761599779129027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,4,power_law_1.01,1.2342528343200683
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,4,power_law_1.2,0.163155198097229
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,4,power_law_1.01,1.5642111778259278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,4,power_law_1.2,0.13156479597091675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,4,power_law_1.2,0.20152320861816406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,4,power_law_1.01,2.0079935073852537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,4,power_law_1.2,0.2835200071334839
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,4,power_law_1.01,2.7857343673706056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,4,power_law_1.2,0.3115839958190918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,4,power_law_1.01,3.085663986206055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,4,power_law_1.2,0.4211455821990967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,4,power_law_1.01,4.823174285888672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,4,power_law_1.2,0.44490880966186525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,4,power_law_1.2,0.45187201499938967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,4,power_law_1.01,9.492819213867188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,4,power_law_1.2,0.4670271873474121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,4,power_law_1.2,0.5030720233917236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,4,power_law_1.2,0.524294376373291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,4,power_law_1.2,0.528876781463623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,4,power_law_1.2,0.5542655944824219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,4,power_law_1.2,0.5583744049072266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,4,power_law_1.2,0.6022143840789795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,4,power_law_1.2,0.6638271808624268
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,4,power_law_1.2,0.6761280059814453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,4,power_law_1.2,0.8006464004516601
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,4,power_law_1.2,0.8612671852111816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,4,power_law_1.2,1.0781503677368165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,4,power_law_1.2,1.031993579864502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,4,power_law_1.2,1.3382464408874513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,4,power_law_1.2,1.5260479927062989
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,4,power_law_1.2,2.1442943572998048
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,4,power_law_1.2,2.834105682373047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,4,power_law_1.2,3.5117889404296876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,4,power_law_1.2,5.297766494750976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,4,power_law_1.2,12.13354263305664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,2,power_law_1.01,0.08614400029182434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,2,power_law_1.01,0.11420799493789673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,2,power_law_1.01,0.1705407977104187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,2,power_law_1.01,0.1379647970199585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,2,power_law_1.01,0.22008960247039794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,2,power_law_1.01,0.2962752103805542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,2,power_law_1.01,0.3407167911529541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,2,power_law_1.01,0.4437312126159668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,2,power_law_1.01,0.45683841705322265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,2,power_law_1.01,0.4871551990509033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,2,power_law_1.01,0.5088448047637939
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,2,power_law_1.2,0.0871295988559723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,2,power_law_1.01,0.5092735767364502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,2,power_law_1.2,0.11683199405670167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,2,power_law_1.01,0.5330239772796631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,2,power_law_1.2,0.12357120513916016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,2,power_law_1.01,0.5477568149566651
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,2,power_law_1.2,0.1381183981895447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,2,power_law_1.01,0.570310401916504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,2,power_law_1.2,0.1923967957496643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,2,power_law_1.01,0.5870912075042725
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,2,power_law_1.2,0.2626431941986084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,2,power_law_1.01,0.6108672142028808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,2,power_law_1.2,0.304422402381897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,2,power_law_1.01,0.695027208328247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,2,power_law_1.2,0.4223936080932617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,2,power_law_1.01,0.7474175930023194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,2,power_law_1.2,0.4481919765472412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,2,power_law_1.01,0.8555647850036621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,2,power_law_1.2,0.46007680892944336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,2,power_law_1.01,0.8506624221801757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,2,power_law_1.2,0.48137598037719725
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,2,power_law_1.01,1.0067328453063964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,2,power_law_1.2,0.512505578994751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,2,power_law_1.01,1.1969087600708008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,2,power_law_1.2,0.5247935771942138
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,2,power_law_1.01,1.504800033569336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,2,power_law_1.2,0.5473216056823731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,2,power_law_1.01,1.6776447296142578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,2,power_law_1.2,0.5702335834503174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,2,power_law_1.01,2.151750373840332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,2,power_law_1.2,0.5821248054504394
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,2,power_law_1.01,2.743212890625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,2,power_law_1.2,0.6433663845062256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,2,power_law_1.01,3.346752166748047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,2,power_law_1.2,0.7019455909729004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,2,power_law_1.2,0.7707583904266357
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,2,power_law_1.01,5.337619018554688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,2,power_law_1.2,0.9304896354675293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,2,power_law_1.01,10.469522857666016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,2,power_law_1.2,0.8993535995483398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,2,power_law_1.2,1.1015040397644043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,2,power_law_1.2,1.3087679862976074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,2,power_law_1.2,1.6018495559692383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,2,power_law_1.2,1.7452096939086914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,2,power_law_1.2,2.339520072937012
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,2,power_law_1.2,3.0155712127685548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,2,power_law_1.2,3.8416576385498047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,2,power_law_1.2,5.836204910278321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,2,power_law_1.2,11.737721252441407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,1,power_law_1.01,0.07141119837760926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,1,power_law_1.01,0.09435520172119141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,1,power_law_1.01,0.12239999771118164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,1,power_law_1.01,0.149017596244812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,1,power_law_1.01,0.23423359394073487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,1,power_law_1.01,0.3173696041107178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,8,power_law_1.01,0.07078400254249573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,1,power_law_1.01,0.37470719814300535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,8,power_law_1.01,0.07119359970092773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,1,power_law_1.01,0.47528958320617676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,8,power_law_1.01,0.06791679859161377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,8,power_law_1.01,0.06669440269470214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,1,power_law_1.01,0.5014783859252929
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,8,power_law_1.01,0.06689919829368592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,1,power_law_1.01,0.5223680019378663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,8,power_law_1.01,0.06710399985313416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,8,power_law_1.01,0.06915199756622314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,1,power_law_1.01,0.546950387954712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,8,power_law_1.01,0.07159039974212647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,1,power_law_1.01,0.5727551937103271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,8,power_law_1.01,0.07571200132369996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,8,power_law_1.01,0.08267520070075988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,1,power_law_1.01,0.5772543907165527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,8,power_law_1.01,0.0732479989528656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,1,power_law_1.01,0.6178175926208496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,8,power_law_1.01,0.08833919763565064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,8,power_law_1.01,0.08388479948043823
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,1,power_law_1.01,0.6263936042785645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,8,power_law_1.01,0.09617919921875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,1,power_law_1.01,0.6483200073242188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,8,power_law_1.01,0.11749119758605957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,8,power_law_1.01,0.11952639818191528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,1,power_law_1.01,0.722867202758789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,8,power_law_1.2,0.07177600264549255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,8,power_law_1.01,0.12711679935455322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,8,power_law_1.2,0.07096319794654846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,1,power_law_1.01,0.8010944366455078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,8,power_law_1.01,0.16581759452819825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,8,power_law_1.2,0.06807039976119995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,8,power_law_1.01,0.23196799755096437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,1,power_law_1.01,0.8195391654968261
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,8,power_law_1.2,0.06747519969940186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,8,power_law_1.01,0.3050751924514771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,8,power_law_1.2,0.06767359972000123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,1,power_law_1.01,0.9370880126953125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,8,power_law_1.01,0.3386559963226318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,8,power_law_1.2,0.0680895984172821
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,8,power_law_1.01,0.46421117782592775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,1,power_law_1.01,1.054643154144287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,8,power_law_1.2,0.07071999907493591
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,1,power_law_1.2,0.0738048017024994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,8,power_law_1.01,0.5404032230377197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,8,power_law_1.2,0.0735871970653534
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,1,power_law_1.01,1.2539135932922363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,8,power_law_1.01,0.874835205078125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,1,power_law_1.2,0.09550079703330994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,8,power_law_1.2,0.07648640275001525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,8,power_law_1.01,1.147430419921875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,1,power_law_1.01,1.5072511672973632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,8,power_law_1.2,0.08506879806518555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,1,power_law_1.2,0.10882560014724732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,8,power_law_1.01,1.750547218322754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,8,power_law_1.2,0.08119040131568908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,1,power_law_1.01,1.917465591430664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,1,power_law_1.2,0.15450880527496338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,8,power_law_1.01,2.421887969970703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,8,power_law_1.2,0.08794239759445191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,1,power_law_1.01,2.293894386291504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,8,power_law_1.2,0.09593600034713745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,8,power_law_1.01,3.1212799072265627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,1,power_law_1.2,0.2124608039855957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,8,power_law_1.2,0.09755520224571228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,8,power_law_1.01,5.03306884765625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,1,power_law_1.01,3.0270784378051756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,1,power_law_1.2,0.2890559911727905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,8,power_law_1.2,0.12195199728012085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,8,power_law_1.2,0.12379519939422608
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,8,power_law_1.01,9.598278045654297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,1,power_law_1.2,0.340447998046875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,1,power_law_1.01,3.915903854370117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,8,power_law_1.2,0.12707200050354003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,1,power_law_1.2,0.4530943870544434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,8,power_law_1.2,0.17069439888000487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,1,power_law_1.01,4.6662849426269535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,8,power_law_1.2,0.19260799884796143
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,1,power_law_1.2,0.4797183990478516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,8,power_law_1.2,0.27472639083862305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,1,power_law_1.01,7.132902526855469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,1,power_law_1.2,0.4989759922027588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,8,power_law_1.2,0.3611520051956177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,8,power_law_1.2,0.4998079776763916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,1,power_law_1.2,0.5387072086334228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,8,power_law_1.2,0.5985023975372314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,1,power_law_1.01,13.851986694335938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,8,power_law_1.2,0.9246975898742675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,1,power_law_1.2,0.5526336193084717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,8,power_law_1.2,1.1153984069824219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,1,power_law_1.2,0.5726912021636963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,8,power_law_1.2,1.7815807342529297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,1,power_law_1.2,0.5906943798065185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,8,power_law_1.2,2.411609649658203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,8,power_law_1.2,2.9791040420532227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,1,power_law_1.2,0.6091584205627442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,8,power_law_1.2,5.159199905395508
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,1,power_law_1.2,0.6357632160186768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,8,power_law_1.2,10.483379364013672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,1,power_law_1.2,0.7506752014160156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,1,power_law_1.2,0.8399744033813477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,1,power_law_1.2,0.8508095741271973
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,1,power_law_1.2,0.9722687721252441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,1,power_law_1.2,1.0654335975646974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,1,power_law_1.2,1.288691234588623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,1,power_law_1.2,1.5346495628356933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,1,power_law_1.2,1.9305280685424804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,4,power_law_1.01,0.06812160015106201
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,4,power_law_1.01,0.05562880039215088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,1,power_law_1.2,2.3317312240600585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,4,power_law_1.01,0.05502079725265503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,4,power_law_1.01,0.06444159746170045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,1,power_law_1.2,3.065932846069336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,4,power_law_1.01,0.06381440162658691
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,4,power_law_1.01,0.06584960222244263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,1,power_law_1.2,3.986707305908203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,4,power_law_1.01,0.0654591977596283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,4,power_law_1.01,0.06689280271530151
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,4,power_law_1.2,0.0685375988483429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,1,power_law_1.2,4.817375946044922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,4,power_law_1.01,0.06872959733009339
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,4,power_law_1.2,0.05788800120353699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,4,power_law_1.01,0.0720255970954895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,4,power_law_1.2,0.06259199976921082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,1,power_law_1.2,7.238931274414062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,4,power_law_1.01,0.06956160068511963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,4,power_law_1.2,0.06505600214004517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,4,power_law_1.01,0.07262719869613647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,4,power_law_1.2,0.06321280002593994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,4,power_law_1.01,0.0750976026058197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,4,power_law_1.2,0.06485120058059693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,1,power_law_1.2,14.40386505126953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,4,power_law_1.01,0.0828607976436615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,4,power_law_1.2,0.06506879925727845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,4,power_law_1.01,0.10150400400161744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,4,power_law_1.2,0.06854400038719177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,2,power_law_1.01,0.04390400052070618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,4,power_law_1.01,0.10744320154190064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,4,power_law_1.2,0.07100160121917724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,2,power_law_1.01,0.057843202352523805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,4,power_law_1.01,0.11605119705200195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,4,power_law_1.2,0.07633280158042907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,2,power_law_1.01,0.051910400390625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,4,power_law_1.01,0.14984320402145385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,4,power_law_1.2,0.06956160068511963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,2,power_law_1.01,0.060096001625061034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,4,power_law_1.01,0.1568063974380493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,4,power_law_1.2,0.07323520183563233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,2,power_law_1.01,0.06152960062026978
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,4,power_law_1.01,0.2153791904449463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,4,power_law_1.2,0.08105599880218506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,2,power_law_1.01,0.061740797758102414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,4,power_law_1.01,0.253273606300354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,4,power_law_1.2,0.07980160117149353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,2,power_law_1.01,0.06602240204811097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,4,power_law_1.01,0.3308799982070923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,4,power_law_1.2,0.09412479996681214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,2,power_law_1.01,0.06645119786262513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,4,power_law_1.01,0.4242688179016113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,4,power_law_1.2,0.09782400131225585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,2,power_law_1.01,0.06727039813995361
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,4,power_law_1.2,0.1078719973564148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,4,power_law_1.01,0.6737152099609375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,2,power_law_1.01,0.06787840127944947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,4,power_law_1.2,0.15968639850616456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,4,power_law_1.01,0.8744128227233887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,2,power_law_1.01,0.06972799897193908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,4,power_law_1.2,0.1543552041053772
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,4,power_law_1.01,1.1764863967895507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,2,power_law_1.01,0.07156479954719544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,4,power_law_1.2,0.22275838851928711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,4,power_law_1.01,1.6399616241455077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,2,power_law_1.01,0.07423359751701356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,4,power_law_1.2,0.2673919916152954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,4,power_law_1.01,1.976038360595703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,2,power_law_1.01,0.0791487991809845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,4,power_law_1.2,0.3521791934967041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,4,power_law_1.01,3.8581504821777344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,2,power_law_1.01,0.09263359904289245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,4,power_law_1.2,0.4912384033203125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,2,power_law_1.01,0.09756799936294555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,4,power_law_1.2,0.7404928207397461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,4,power_law_1.01,7.568473815917969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,2,power_law_1.01,0.10001920461654663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,4,power_law_1.2,1.086796760559082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,2,power_law_1.01,0.10802559852600098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,4,power_law_1.2,1.6219263076782227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,2,power_law_1.01,0.13915519714355468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,4,power_law_1.2,1.6088384628295898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,2,power_law_1.01,0.1586176037788391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,2,power_law_1.01,0.20038399696350098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,4,power_law_1.2,1.8205951690673827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,2,power_law_1.01,0.24276480674743653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,2,power_law_1.2,0.042668798565864564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,4,power_law_1.2,4.035718536376953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,2,power_law_1.01,0.3232640027999878
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,2,power_law_1.2,0.04881280064582825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,4,power_law_1.2,7.288563537597656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,2,power_law_1.01,0.4899775981903076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,2,power_law_1.2,0.05148800015449524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,2,power_law_1.01,0.6062848091125488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,2,power_law_1.2,0.061318397521972656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,2,power_law_1.01,0.902239990234375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,2,power_law_1.2,0.06111360192298889
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,2,power_law_1.01,1.0883968353271485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,2,power_law_1.2,0.06296319961547851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,2,power_law_1.2,0.06684799790382386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,2,power_law_1.01,1.5080191612243652
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,2,power_law_1.2,0.06520320177078247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,2,power_law_1.01,2.127961540222168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,2,power_law_1.2,0.06746879816055298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,2,power_law_1.01,4.913433456420899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,2,power_law_1.2,0.06972159743309021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,2,power_law_1.2,0.06970880031585694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,2,power_law_1.2,0.0717631995677948
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,2,power_law_1.2,0.07299200296401978
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,2,power_law_1.2,0.0803712010383606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,2,power_law_1.2,0.09306880235671997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,2,power_law_1.2,0.09633920192718506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,2,power_law_1.2,0.09511039853096008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,2,power_law_1.2,0.11395200490951538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,2,power_law_1.2,0.12501120567321777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,2,power_law_1.2,0.15819519758224487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,2,power_law_1.2,0.20919039249420165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,1,power_law_1.01,0.039654400944709775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,2,power_law_1.2,0.28231680393218994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,1,power_law_1.01,0.04211840033531189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,2,power_law_1.2,0.35111680030822756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,1,power_law_1.01,0.04335359930992126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,2,power_law_1.2,0.4784895896911621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,1,power_law_1.01,0.05974400043487549
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,1,power_law_1.01,0.06096640229225159
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,2,power_law_1.2,0.6406464099884033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,1,power_law_1.01,0.06094719767570496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,2,power_law_1.2,0.9726783752441406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,1,power_law_1.01,0.06465280055999756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,2,power_law_1.2,1.2194496154785157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,1,power_law_1.01,0.06341760158538819
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,2,power_law_1.2,1.6206592559814452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,1,power_law_1.2,0.03864319920539856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,1,power_law_1.01,0.06342399716377259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,1,power_law_1.2,0.04007039964199066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,1,power_law_1.01,0.06546559929847717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,2,power_law_1.2,2.6233600616455077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,1,power_law_1.2,0.04232960045337677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,1,power_law_1.01,0.06711040139198303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,2,power_law_1.2,5.150995254516602
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,1,power_law_1.2,0.060140800476074216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,1,power_law_1.01,0.06874880194664001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,1,power_law_1.2,0.061587202548980716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,1,power_law_1.01,0.07018240094184876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,1,power_law_1.2,0.06096640229225159
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,1,power_law_1.01,0.07365120053291321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,1,power_law_1.2,0.06465280055999756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,1,power_law_1.01,0.08410879969596863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,1,power_law_1.2,0.06506239771842956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,1,power_law_1.2,0.06424319744110107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,1,power_law_1.2,0.06506879925727845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,1,power_law_1.2,0.06669440269470214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,1,power_law_1.2,0.06891520023345947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,1,power_law_1.2,0.07121279835700989
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,1,power_law_1.2,0.07239680290222168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,1,power_law_1.2,0.082259202003479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,1,power_law_1.2,0.08636800050735474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,1,power_law_1.2,0.09127039909362793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,1,power_law_1.2,0.10316159725189208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,1,power_law_1.2,0.12136960029602051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,1,power_law_1.2,0.14697599411010742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,1,power_law_1.2,0.17688319683074952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,1,power_law_1.2,0.2301248073577881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,8,power_law_1.01,0.09020159840583801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,1,power_law_1.2,0.27847039699554443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,8,power_law_1.01,0.08897280097007751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,1,power_law_1.2,0.39027841091156007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,8,power_law_1.01,0.08979840278625488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,1,power_law_1.2,0.49657602310180665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,8,power_law_1.01,0.08650879859924317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,1,power_law_1.2,0.7134463787078857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,8,power_law_1.01,0.08734719753265381
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,1,power_law_1.2,0.9321727752685547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,8,power_law_1.01,0.08897280097007751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,8,power_law_1.01,0.09164159893989562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,1,power_law_1.2,1.1642304420471192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,8,power_law_1.01,0.09184640049934387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,1,power_law_1.2,1.8718015670776367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,8,power_law_1.01,0.1016767978668213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,1,power_law_1.2,3.797932815551758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,8,power_law_1.01,0.10249600410461426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,8,power_law_1.01,0.10414079427719117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,8,power_law_1.01,0.12209279537200927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,8,power_law_1.01,0.12051199674606324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,8,power_law_1.01,0.13690240383148194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,8,power_law_1.01,0.1519744038581848
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,8,power_law_1.01,0.1737663984298706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,8,power_law_1.01,0.1723199963569641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,8,power_law_1.01,0.23582079410552978
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,8,power_law_1.01,0.26672000885009767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,8,power_law_1.01,0.3578815937042236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,8,power_law_1.01,0.5096320152282715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,8,power_law_1.01,0.6683519840240478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,8,power_law_1.01,0.8878848075866699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,8,power_law_1.01,1.2989376068115235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,8,power_law_1.2,0.0887615978717804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,8,power_law_1.2,0.08895999789237977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,8,power_law_1.01,1.6608064651489258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,8,power_law_1.2,0.08977280259132385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,8,power_law_1.01,2.6975040435791016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,8,power_law_1.2,0.08549119830131531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,8,power_law_1.01,3.9807743072509765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,8,power_law_1.2,0.08609279990196228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,8,power_law_1.01,4.785843276977539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,8,power_law_1.2,0.08895999789237977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,8,power_law_1.01,7.489817810058594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,8,power_law_1.2,0.09223679900169372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,8,power_law_1.2,0.09244160056114196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,8,power_law_1.2,0.09797760248184204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,8,power_law_1.01,21.208345031738283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,8,power_law_1.2,0.101254403591156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,8,power_law_1.2,0.10494719743728638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,8,power_law_1.2,0.11804159879684448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,8,power_law_1.2,0.11108479499816895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,8,power_law_1.2,0.1356735944747925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,8,power_law_1.2,0.16814719438552855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,8,power_law_1.2,0.17374720573425292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,8,power_law_1.2,0.2072767972946167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,8,power_law_1.2,0.2898751974105835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,8,power_law_1.2,0.2904896020889282
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,8,power_law_1.2,0.39146239757537843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,8,power_law_1.2,0.45145602226257325
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,8,power_law_1.2,0.7027455806732178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,8,power_law_1.2,0.9038784027099609
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,8,power_law_1.2,1.309984016418457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,8,power_law_1.2,1.724710464477539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,8,power_law_1.2,2.788230323791504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,8,power_law_1.2,3.451551818847656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,4,power_law_1.01,0.09844480156898498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,8,power_law_1.2,5.159187316894531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,4,power_law_1.01,0.06505600214004517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,4,power_law_1.01,0.07611520290374756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,8,power_law_1.2,8.182041931152344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,4,power_law_1.01,0.08103039860725403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,4,power_law_1.01,0.0819711983203888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,8,power_law_1.2,16.174176025390626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,4,power_law_1.01,0.08472959995269776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,4,power_law_1.01,0.08636159896850586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,4,power_law_1.01,0.08758400082588196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,4,power_law_1.01,0.08839679956436157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,4,power_law_1.01,0.09333119988441467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,4,power_law_1.01,0.0920960009098053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,4,power_law_1.01,0.09946879744529724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,4,power_law_1.01,0.10684159994125367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,4,power_law_1.01,0.11217279434204101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,4,power_law_1.01,0.13511040210723876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,4,power_law_1.01,0.14122240543365477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,4,power_law_1.01,0.14349440336227418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,4,power_law_1.01,0.17889280319213868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,4,power_law_1.01,0.2280895948410034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,4,power_law_1.01,0.3095936059951782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,4,power_law_1.01,0.40236802101135255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,4,power_law_1.01,0.4662655830383301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,4,power_law_1.01,0.6597951889038086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,4,power_law_1.01,0.9256064414978027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,4,power_law_1.01,1.067136001586914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,4,power_law_1.2,0.1020799994468689
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,4,power_law_1.01,1.9961151123046874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,4,power_law_1.2,0.06993280053138733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,4,power_law_1.01,2.7649280548095705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,4,power_law_1.2,0.08324480056762695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,4,power_law_1.2,0.08098559975624084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,4,power_law_1.01,4.201196670532227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,4,power_law_1.2,0.08262400031089782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,4,power_law_1.01,7.2828224182128904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,4,power_law_1.2,0.08467199802398681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,4,power_law_1.2,0.08693119883537292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,4,power_law_1.01,11.12630386352539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,4,power_law_1.2,0.08775039911270141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,4,power_law_1.2,0.0902079999446869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,4,power_law_1.2,0.09075199961662292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,4,power_law_1.2,0.0906175971031189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,4,power_law_1.2,0.0992255985736847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,4,power_law_1.2,0.10329600572586059
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,4,power_law_1.2,0.1123263955116272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,4,power_law_1.2,0.13034240007400513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,4,power_law_1.2,0.1493888020515442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,4,power_law_1.2,0.14960000514984131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,4,power_law_1.2,0.1880959987640381
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,4,power_law_1.2,0.22291839122772217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,4,power_law_1.2,0.337606406211853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,4,power_law_1.2,0.3832000017166138
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,4,power_law_1.2,0.5260287761688233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,4,power_law_1.2,0.7215871810913086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,2,power_law_1.01,0.05764480233192444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,4,power_law_1.2,1.0333056449890137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,2,power_law_1.01,0.061312001943588254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,4,power_law_1.2,1.4797632217407226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,2,power_law_1.01,0.07011839747428894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,4,power_law_1.2,2.166048049926758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,2,power_law_1.01,0.08118399977684021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,4,power_law_1.2,3.4597824096679686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,2,power_law_1.01,0.08077440261840821
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,2,power_law_1.01,0.08357120156288148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,4,power_law_1.2,4.140518569946289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,2,power_law_1.01,0.08384640216827392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,4,power_law_1.2,5.267129516601562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,2,power_law_1.01,0.08752639889717102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,2,power_law_1.01,0.08650239706039428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,4,power_law_1.2,13.89248046875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,2,power_law_1.01,0.08979200124740601
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,2,power_law_1.01,0.0907904028892517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,2,power_law_1.01,0.09286400079727172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,2,power_law_1.01,0.09449599981307984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,2,power_law_1.01,0.10001920461654663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,2,power_law_1.01,0.11571840047836304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,2,power_law_1.01,0.12132480144500732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,2,power_law_1.01,0.12617599964141846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,2,power_law_1.01,0.1454975962638855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,2,power_law_1.01,0.1759935975074768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,2,power_law_1.01,0.2253567934036255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,2,power_law_1.01,0.2814784049987793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,2,power_law_1.01,0.3920703887939453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,2,power_law_1.01,0.4658048152923584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,2,power_law_1.01,0.697433614730835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,2,power_law_1.01,0.9575039863586425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,2,power_law_1.2,0.05278080105781555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,2,power_law_1.01,1.3386560440063477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,2,power_law_1.2,0.06218240261077881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,2,power_law_1.01,1.78287353515625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,2,power_law_1.2,0.0683135986328125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,2,power_law_1.01,2.4599231719970702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,2,power_law_1.2,0.08021759986877441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,2,power_law_1.01,3.316384124755859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,2,power_law_1.2,0.0810368001461029
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,2,power_law_1.2,0.08410879969596863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,2,power_law_1.01,8.147846221923828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,2,power_law_1.2,0.08573439717292786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,2,power_law_1.2,0.08882560133934021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,2,power_law_1.2,0.08820480108261108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,2,power_law_1.2,0.09291520118713378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,1,power_law_1.01,0.08881919980049133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,2,power_law_1.2,0.09004160165786743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,1,power_law_1.01,0.09166719913482665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,2,power_law_1.2,0.09249280095100403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,1,power_law_1.01,0.1072383999824524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,2,power_law_1.2,0.09740800261497498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,1,power_law_1.01,0.1217919945716858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,2,power_law_1.2,0.10234240293502808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,1,power_law_1.01,0.14963200092315673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,2,power_law_1.2,0.11994240283966065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,1,power_law_1.01,0.17646080255508423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,2,power_law_1.2,0.12178560495376586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,1,power_law_1.01,0.23381121158599855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,2,power_law_1.2,0.13346560001373292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,1,power_law_1.01,0.2829632043838501
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,2,power_law_1.2,0.1668287992477417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,2,power_law_1.2,0.19573119878768921
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,1,power_law_1.01,0.40010881423950195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,2,power_law_1.2,0.2141184091567993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,1,power_law_1.01,0.5080319881439209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,2,power_law_1.2,0.3120448112487793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,1,power_law_1.01,0.7306431770324707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,2,power_law_1.2,0.4238783836364746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,1,power_law_1.01,0.9563455581665039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,2,power_law_1.2,0.48592000007629393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,1,power_law_1.01,1.1945280075073241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,2,power_law_1.2,0.7601600170135498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,1,power_law_1.01,1.9092672348022461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,1,power_law_1.01,0.0461760014295578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,2,power_law_1.2,0.9796799659729004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,1,power_law_1.01,0.055379199981689456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,1,power_law_1.01,3.906905746459961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,2,power_law_1.2,1.6076095581054688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,1,power_law_1.01,0.055801600217819214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,2,power_law_1.2,1.8464063644409179
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,1,power_law_1.01,0.0815999984741211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,1,power_law_1.01,0.08119680285453797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,2,power_law_1.2,2.749363136291504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,1,power_law_1.01,0.08324480056762695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,2,power_law_1.2,4.520896148681641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,1,power_law_1.01,0.08508800268173218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,1,power_law_1.01,0.08529279828071594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,2,power_law_1.2,8.615257263183594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,1,power_law_1.01,0.08508800268173218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,1,power_law_1.01,0.08611199855804444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,1,power_law_1.01,0.08979200124740601
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,1,power_law_1.01,0.09347839951515198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,1,power_law_1.01,0.09384959936141968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,1,power_law_1.01,0.10126080513000488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,1,power_law_1.01,0.11273599863052368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,1,power_law_1.01,0.11273599863052368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,1,power_law_1.01,0.1213312029838562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,1,power_law_1.01,0.1430400013923645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,1,power_law_1.01,0.17417600154876708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,1,power_law_1.01,0.21267199516296387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,1,power_law_1.01,0.24606080055236818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,1,power_law_1.01,0.3318720102310181
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,1,power_law_1.01,0.4051072120666504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,1,power_law_1.2,0.04268159866333008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,1,power_law_1.01,0.586624002456665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,1,power_law_1.2,0.05128960013389587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,1,power_law_1.2,0.06349440217018128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,1,power_law_1.01,0.7523136138916016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,1,power_law_1.2,0.07995520234107971
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,1,power_law_1.01,1.1072319984436034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,1,power_law_1.2,0.08138880133628845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,1,power_law_1.01,1.4594816207885741
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,1,power_law_1.2,0.08261119723320007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,1,power_law_1.01,1.8266815185546874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,1,power_law_1.2,0.08568959832191467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,1,power_law_1.01,2.985241508483887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,1,power_law_1.2,0.0840511977672577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,1,power_law_1.2,0.0862335979938507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,1,power_law_1.01,6.032870483398438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,1,power_law_1.2,0.08522239923477173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,1,power_law_1.2,0.0889855980873108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,8,power_law_1.01,0.12669440507888793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,1,power_law_1.2,0.09183359742164612
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,1,power_law_1.2,0.09511039853096008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,8,power_law_1.01,0.16437120437622071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,1,power_law_1.2,0.0965503990650177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,8,power_law_1.01,0.11626240015029907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,1,power_law_1.2,0.1131327986717224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,8,power_law_1.01,0.10028159618377686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,1,power_law_1.2,0.11354880332946778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,1,power_law_1.2,0.1201024055480957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,8,power_law_1.01,0.13672319650650025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,8,power_law_1.2,0.12729599475860595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,1,power_law_1.2,0.143014395236969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,8,power_law_1.01,0.1674623966217041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,8,power_law_1.2,0.15618560314178467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,1,power_law_1.2,0.16597119569778443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,8,power_law_1.01,0.19509119987487794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,8,power_law_1.2,0.0822655975818634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,1,power_law_1.2,0.20611200332641602
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,8,power_law_1.01,0.2153856039047241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,8,power_law_1.2,0.09968000054359435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,1,power_law_1.2,0.24707839488983155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,1,power_law_1.2,0.32039039134979247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,8,power_law_1.01,0.2237760066986084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,8,power_law_1.2,0.13223040103912354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,1,power_law_1.2,0.3945280075073242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,8,power_law_1.01,0.22766718864440919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,8,power_law_1.2,0.15639040470123292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,1,power_law_1.2,0.5604159832000732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,8,power_law_1.01,0.23831679821014404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,8,power_law_1.2,0.1891584038734436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,1,power_law_1.2,0.712992000579834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,8,power_law_1.01,0.23914239406585694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,1,power_law_1.2,1.0316415786743165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,8,power_law_1.2,0.20842878818511962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,1,power_law_1.2,1.3660863876342773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,8,power_law_1.01,0.24630401134490967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,8,power_law_1.2,0.21251199245452881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,1,power_law_1.2,1.7025663375854492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,8,power_law_1.2,0.22232959270477295
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,8,power_law_1.01,0.25511679649353025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,1,power_law_1.2,2.7341503143310546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,8,power_law_1.2,0.22583680152893065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,8,power_law_1.01,0.25428481101989747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,1,power_law_1.2,5.687577438354492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,8,power_law_1.2,0.24958720207214355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,8,power_law_1.01,0.2547008037567139
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,8,power_law_1.2,0.23687679767608644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,8,power_law_1.01,0.2772288084030151
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,8,power_law_1.2,0.2590015888214111
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,8,power_law_1.01,0.30037119388580324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,8,power_law_1.2,0.2559360027313232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,8,power_law_1.01,0.337446403503418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,8,power_law_1.2,0.2757951974868774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,8,power_law_1.01,0.4064511775970459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,8,power_law_1.2,0.2913536071777344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,8,power_law_1.01,0.39560320377349856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,4,power_law_1.01,0.11908479928970336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,8,power_law_1.2,0.3214591979980469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,8,power_law_1.01,0.5231872081756592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,4,power_law_1.01,0.11560319662094116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,8,power_law_1.2,0.3509696006774902
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,8,power_law_1.01,0.5833920001983642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,4,power_law_1.01,0.08038399815559387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,8,power_law_1.2,0.42570881843566893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,8,power_law_1.01,0.774073600769043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,4,power_law_1.01,0.09756799936294555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,8,power_law_1.2,0.4273536205291748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,8,power_law_1.01,0.9616703987121582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,4,power_law_1.01,0.12379519939422608
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,8,power_law_1.2,0.5256576061248779
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,8,power_law_1.01,1.3153471946716309
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,4,power_law_1.01,0.15532159805297852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,8,power_law_1.2,0.638099193572998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,8,power_law_1.01,1.677235221862793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,4,power_law_1.01,0.1983423948287964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,8,power_law_1.2,0.822815990447998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,8,power_law_1.01,2.2750528335571287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,4,power_law_1.01,0.22721920013427735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,8,power_law_1.2,1.0622207641601562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,8,power_law_1.01,3.184556770324707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,4,power_law_1.01,0.22474238872528077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,8,power_law_1.2,1.5195520401000977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,4,power_law_1.01,0.2302720069885254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,8,power_law_1.2,1.9707263946533202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,8,power_law_1.01,6.882841491699219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,4,power_law_1.01,0.23558399677276612
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,8,power_law_1.2,2.3002496719360352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,4,power_law_1.01,0.24523520469665527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,8,power_law_1.2,3.7463104248046877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,4,power_law_1.01,0.2536384105682373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,4,power_law_1.01,0.2622208118438721
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,8,power_law_1.2,7.916889953613281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,4,power_law_1.01,0.27820799350738523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,4,power_law_1.01,0.2844928026199341
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,4,power_law_1.01,0.28845438957214353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,4,power_law_1.01,0.32222719192504884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,4,power_law_1.2,0.10289280414581299
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,4,power_law_1.01,0.33720319271087645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,4,power_law_1.2,0.11148799657821655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,4,power_law_1.01,0.3982208013534546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,4,power_law_1.2,0.07708799839019775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,4,power_law_1.01,0.43386240005493165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,4,power_law_1.2,0.10207359790802002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,4,power_law_1.01,0.5234879970550537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,4,power_law_1.2,0.12419840097427368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,4,power_law_1.01,0.6259647846221924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,4,power_law_1.2,0.15736960172653197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,4,power_law_1.01,0.864140796661377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,4,power_law_1.2,0.20448000431060792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,4,power_law_1.01,0.9923392295837402
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,4,power_law_1.2,0.2151103973388672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,4,power_law_1.01,1.401740837097168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,4,power_law_1.2,0.21226239204406738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,4,power_law_1.01,1.7496896743774415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,4,power_law_1.2,0.22188160419464112
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,4,power_law_1.01,2.237721633911133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,4,power_law_1.2,0.2425663948059082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,4,power_law_1.2,0.23887999057769777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,4,power_law_1.01,3.2966846466064452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,4,power_law_1.2,0.2503423929214478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,4,power_law_1.01,6.509235382080078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,4,power_law_1.2,0.2673408031463623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,4,power_law_1.2,0.27799038887023925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,4,power_law_1.2,0.2941760063171387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,4,power_law_1.2,0.30789759159088137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,4,power_law_1.2,0.3420991897583008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,4,power_law_1.2,0.35029120445251466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,4,power_law_1.2,0.40517759323120117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,4,power_law_1.2,0.44163198471069337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,2,power_law_1.01,0.06934400200843811
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,4,power_law_1.2,0.532147216796875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,2,power_law_1.01,0.09166079759597778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,4,power_law_1.2,0.6491007804870605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,2,power_law_1.01,0.08246399760246277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,4,power_law_1.2,0.8887104034423828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,2,power_law_1.01,0.09883520007133484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,4,power_law_1.2,1.071180820465088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,2,power_law_1.2,0.06936320066452026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,2,power_law_1.01,0.14061440229415895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,4,power_law_1.2,1.4267135620117188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,2,power_law_1.2,0.09189760088920593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,2,power_law_1.01,0.1596735954284668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,4,power_law_1.2,1.8221887588500976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,2,power_law_1.2,0.07612800002098083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,2,power_law_1.01,0.2194751977920532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,4,power_law_1.2,2.1889856338500975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,2,power_law_1.2,0.10377600193023681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,2,power_law_1.01,0.2209088087081909
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,2,power_law_1.2,0.12874879837036132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,2,power_law_1.01,0.23566079139709473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,4,power_law_1.2,3.669267272949219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,2,power_law_1.2,0.15702400207519532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,2,power_law_1.01,0.24241280555725098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,4,power_law_1.2,7.337651062011719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,2,power_law_1.2,0.22110719680786134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,2,power_law_1.01,0.26042239665985106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,2,power_law_1.2,0.23094398975372316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,2,power_law_1.01,0.26369919776916506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,2,power_law_1.2,0.23708798885345458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,2,power_law_1.01,0.2710848093032837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,2,power_law_1.01,0.28090879917144773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,2,power_law_1.2,0.24486401081085205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,2,power_law_1.2,0.25961599349975584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,2,power_law_1.01,0.28275840282440184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,2,power_law_1.2,0.2686208009719849
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,2,power_law_1.01,0.2964799880981445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,2,power_law_1.2,0.26965761184692383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,2,power_law_1.01,0.318124794960022
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,2,power_law_1.2,0.2888959884643555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,2,power_law_1.01,0.349727988243103
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,2,power_law_1.2,0.29526400566101074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,2,power_law_1.01,0.38863999843597413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,2,power_law_1.2,0.3022144079208374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,2,power_law_1.01,0.4412799835205078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,2,power_law_1.2,0.35381760597229006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,2,power_law_1.01,0.5080512046813965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,2,power_law_1.2,0.3796224117279053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,2,power_law_1.01,0.625593614578247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,2,power_law_1.2,0.40049281120300295
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,2,power_law_1.01,0.7662911891937256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,2,power_law_1.2,0.4584832191467285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,2,power_law_1.01,1.0165632247924805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,2,power_law_1.2,0.5301631927490235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,2,power_law_1.01,1.1903552055358886
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,2,power_law_1.2,0.6503680229187012
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,2,power_law_1.01,1.6567615509033202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,2,power_law_1.2,0.7818624019622803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,2,power_law_1.01,2.071878433227539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,2,power_law_1.2,1.0083583831787108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,2,power_law_1.01,2.4960256576538087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,2,power_law_1.2,1.2559743881225587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,2,power_law_1.01,3.8319358825683594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,2,power_law_1.2,1.6923776626586915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,2,power_law_1.2,2.127193641662598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,2,power_law_1.01,7.765119934082032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,1,power_law_1.01,0.06992639899253845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,2,power_law_1.2,2.620550346374512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,1,power_law_1.01,0.07708160281181335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,2,power_law_1.2,4.328985595703125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,1,power_law_1.01,0.0859008014202118
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,1,power_law_1.01,0.12625279426574706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,2,power_law_1.2,8.546227264404298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,1,power_law_1.01,0.16926079988479614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,1,power_law_1.01,0.2044991970062256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,1,power_law_1.01,0.26899840831756594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,1,power_law_1.01,0.287827205657959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,1,power_law_1.01,0.2993088006973267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,1,power_law_1.01,0.3070847988128662
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,1,power_law_1.01,0.3175296068191528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,1,power_law_1.01,0.33330559730529785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,1,power_law_1.01,0.3382080078125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,1,power_law_1.01,0.3560192108154297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,8,power_law_1.01,0.07754240036010743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,1,power_law_1.01,0.3582911968231201
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,8,power_law_1.01,0.044172799587249754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,8,power_law_1.01,0.047443199157714847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,1,power_law_1.01,0.3791615962982178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,8,power_law_1.01,0.057894402742385866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,1,power_law_1.01,0.4584383964538574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,8,power_law_1.01,0.06240000128746033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,1,power_law_1.01,0.5329728126525879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,8,power_law_1.2,0.0750976026058197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,8,power_law_1.01,0.07612159848213196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,1,power_law_1.01,0.5088064193725585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,8,power_law_1.2,0.04293760061264038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,8,power_law_1.01,0.07692800164222717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,1,power_law_1.2,0.06888319849967957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,1,power_law_1.01,0.6095615863800049
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,8,power_law_1.01,0.07937920093536377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,1,power_law_1.2,0.07831680178642272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,1,power_law_1.01,0.7170815944671631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,8,power_law_1.01,0.08206080198287964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,1,power_law_1.2,0.09224320054054261
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,8,power_law_1.01,0.0818560004234314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,1,power_law_1.01,0.882579231262207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,8,power_law_1.01,0.08677120208740234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,1,power_law_1.2,0.1196671962738037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,1,power_law_1.01,1.0353343963623047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,8,power_law_1.01,0.08677120208740234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,1,power_law_1.2,0.15164159536361693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,1,power_law_1.01,1.3501184463500977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,8,power_law_1.01,0.09190400242805481
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,1,power_law_1.2,0.1958847999572754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,1,power_law_1.01,1.7103616714477539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,8,power_law_1.01,0.09372159838676453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,1,power_law_1.2,0.26550400257110596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,8,power_law_1.01,0.10069119930267334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,1,power_law_1.01,2.345676803588867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,1,power_law_1.2,0.2810688018798828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,8,power_law_1.01,0.10559359788894654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,1,power_law_1.01,2.944281578063965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,1,power_law_1.2,0.2947776079177856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,8,power_law_1.01,0.10929919481277466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,1,power_law_1.01,3.5664512634277346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,8,power_law_1.01,0.12055039405822754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,1,power_law_1.2,0.3171135902404785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,8,power_law_1.01,0.13346560001373292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,1,power_law_1.2,0.3261248111724854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,1,power_law_1.01,5.472735977172851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,8,power_law_1.01,0.1512768030166626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,1,power_law_1.2,0.3271424055099487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,8,power_law_1.01,0.17319040298461913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,1,power_law_1.01,10.571846771240235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,1,power_law_1.2,0.34703359603881834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,8,power_law_1.01,0.23113598823547363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,1,power_law_1.2,0.42195839881896974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,8,power_law_1.01,0.2817408084869385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,1,power_law_1.2,0.437113618850708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,8,power_law_1.01,0.3509632110595703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,1,power_law_1.2,0.44080638885498047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,8,power_law_1.01,0.5231935977935791
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,1,power_law_1.2,0.4111167907714844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,8,power_law_1.01,0.66593918800354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,1,power_law_1.2,0.4764544010162354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,8,power_law_1.01,0.842470359802246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,1,power_law_1.2,0.5210944175720215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,8,power_law_1.01,1.1109760284423829
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,1,power_law_1.2,0.6238912105560303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,8,power_law_1.01,1.6383232116699218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,1,power_law_1.2,0.7273280143737793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,8,power_law_1.01,3.4598209381103517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,1,power_law_1.2,0.8862015724182128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,1,power_law_1.2,1.039020824432373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,1,power_law_1.2,1.3415167808532715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,1,power_law_1.2,1.7333120346069335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,4,power_law_1.01,0.05375360250473023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,1,power_law_1.2,2.344416046142578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,4,power_law_1.01,0.045151999592781066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,1,power_law_1.2,2.9557504653930664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,4,power_law_1.01,0.0455487996339798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,4,power_law_1.01,0.053337597846984865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,1,power_law_1.2,3.5485824584960937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,4,power_law_1.01,0.06663680076599121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,4,power_law_1.01,0.0803712010383606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,1,power_law_1.2,5.455532836914062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,4,power_law_1.01,0.08406400084495544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,4,power_law_1.01,0.09020159840583801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,1,power_law_1.2,10.507955169677734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,4,power_law_1.01,0.08815360069274902
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,4,power_law_1.01,0.09020159840583801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,4,power_law_1.01,0.09020159840583801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,4,power_law_1.01,0.09041280150413514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,4,power_law_1.2,0.053990399837493895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,4,power_law_1.01,0.09389439821243287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,4,power_law_1.2,0.04007039964199066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,4,power_law_1.01,0.09839360117912292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,4,power_law_1.2,0.046412798762321475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,4,power_law_1.01,0.10413440465927123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,4,power_law_1.2,0.05133439898490906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,4,power_law_1.01,0.1098688006401062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,4,power_law_1.2,0.06056320071220398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,4,power_law_1.01,0.11272959709167481
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,4,power_law_1.2,0.07980800271034241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,4,power_law_1.01,0.12645119428634644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,4,power_law_1.2,0.08470399975776673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,4,power_law_1.01,0.1418176054954529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,4,power_law_1.2,0.08799359798431397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,4,power_law_1.01,0.16782079935073851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,4,power_law_1.2,0.08881279826164246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,4,power_law_1.01,0.19608960151672364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,4,power_law_1.2,0.0877951979637146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,4,power_law_1.01,0.24051198959350586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,4,power_law_1.2,0.09331200122833253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,4,power_law_1.01,0.30320000648498535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,4,power_law_1.2,0.0945472002029419
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,4,power_law_1.2,0.09597439765930176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,4,power_law_1.01,0.4129727840423584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,4,power_law_1.2,0.09759359955787658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,4,power_law_1.01,0.5640960216522217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,4,power_law_1.2,0.10725120306015015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,4,power_law_1.01,0.7195583820343018
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,4,power_law_1.2,0.1144063949584961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,4,power_law_1.01,0.9714624404907226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,2,power_law_1.01,0.04268159866333008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,4,power_law_1.2,0.11419520378112794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,2,power_law_1.01,0.04185599982738495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,4,power_law_1.01,1.1756287574768067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,4,power_law_1.2,0.13223040103912354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,2,power_law_1.01,0.04801279902458191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,4,power_law_1.01,1.8291648864746093
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,4,power_law_1.2,0.14696320295333862
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,2,power_law_1.01,0.05947520136833191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,4,power_law_1.2,0.17728639841079713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,4,power_law_1.01,3.766764831542969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,2,power_law_1.01,0.06704639792442321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,4,power_law_1.2,0.19449599981307983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,2,power_law_1.01,0.08670719861984252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,4,power_law_1.2,0.24444799423217772
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,2,power_law_1.01,0.09387519955635071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,4,power_law_1.2,0.34031360149383544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,2,power_law_1.01,0.10105600357055664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,4,power_law_1.2,0.4188992023468018
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,2,power_law_1.01,0.09633280038833618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,4,power_law_1.2,0.5215551853179932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,2,power_law_1.01,0.10124800205230713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,4,power_law_1.2,0.8006848335266114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,2,power_law_1.01,0.11109119653701782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,4,power_law_1.2,1.0536383628845214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,2,power_law_1.01,0.1131327986717224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,2,power_law_1.01,0.1201024055480957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,4,power_law_1.2,1.2829312324523925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,2,power_law_1.01,0.11149439811706544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,4,power_law_1.2,2.336697578430176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,2,power_law_1.01,0.11721600294113159
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,2,power_law_1.01,0.12009600400924683
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,4,power_law_1.2,4.175385665893555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,2,power_law_1.01,0.13156479597091675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,2,power_law_1.01,0.1512063980102539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,2,power_law_1.01,0.17375999689102173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,2,power_law_1.01,0.20774400234222412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,2,power_law_1.01,0.23192319869995118
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,2,power_law_1.01,0.2921344041824341
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,2,power_law_1.01,0.36012160778045654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,2,power_law_1.2,0.04391680061817169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,2,power_law_1.01,0.4969151973724365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,2,power_law_1.2,0.044326400756835936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,2,power_law_1.01,0.6083392143249512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,2,power_law_1.2,0.048019200563430786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,2,power_law_1.01,0.8166272163391113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,2,power_law_1.2,0.05375360250473023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,2,power_law_1.01,1.1002367973327636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,2,power_law_1.01,1.3370304107666016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,2,power_law_1.01,2.194259262084961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,2,power_law_1.01,4.062681579589844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,1,power_law_1.01,0.04211199879646301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,1,power_law_1.01,0.046214398741722104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,1,power_law_1.01,0.05726720094680786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,1,power_law_1.01,0.06709759831428527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,1,power_law_1.01,0.08144000172615051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,1,power_law_1.01,0.11206400394439697
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,1,power_law_1.01,0.11830400228500366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,1,power_law_1.01,0.11912319660186768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,1,power_law_1.01,0.12280319929122925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,1,power_law_1.01,0.1258944034576416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,1,power_law_1.01,0.13264000415802002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,1,power_law_1.01,0.139193594455719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,1,power_law_1.01,0.1422719955444336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,1,power_law_1.01,0.14206080436706542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,1,power_law_1.01,0.15066239833831788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,1,power_law_1.01,0.15407999753952026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,1,power_law_1.01,0.17032959461212158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,1,power_law_1.2,0.04186240136623383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,1,power_law_1.01,0.20432639122009277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,1,power_law_1.2,0.046777600049972536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,1,power_law_1.01,0.23340160846710206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,1,power_law_1.01,0.2909503936767578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,1,power_law_1.2,0.054150402545928955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,8,power_law_1.2,0.04785279929637909
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,1,power_law_1.01,0.3374399900436401
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,1,power_law_1.2,0.06357759833335877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,8,power_law_1.2,0.058297598361968996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,1,power_law_1.01,0.4388160228729248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,1,power_law_1.2,0.07503359913825988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,8,power_law_1.2,0.05953279733657837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,1,power_law_1.2,0.11148799657821655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,1,power_law_1.01,0.5375232219696044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,8,power_law_1.2,0.07468159794807434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,1,power_law_1.2,0.12008960247039795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,1,power_law_1.01,0.7232831954956055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,8,power_law_1.2,0.0794048011302948
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,1,power_law_1.2,0.12622720003128052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,1,power_law_1.01,0.8998144149780274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,8,power_law_1.2,0.08103039860725403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,1,power_law_1.2,0.13238400220870972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,1,power_law_1.01,1.2696831703186036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,8,power_law_1.2,0.08390399813652039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,1,power_law_1.2,0.1336127996444702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,1,power_law_1.01,1.614156723022461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,8,power_law_1.2,0.08104320168495179
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,1,power_law_1.2,0.14176640510559083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,1,power_law_1.01,1.9920127868652344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,8,power_law_1.2,0.08554239869117737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,1,power_law_1.2,0.15349119901657104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,1,power_law_1.01,3.086886405944824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,8,power_law_1.2,0.09187840223312378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,1,power_law_1.2,0.1590016007423401
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,8,power_law_1.2,0.09330559968948364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,1,power_law_1.2,0.1438591957092285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,1,power_law_1.01,6.1474048614501955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,8,power_law_1.2,0.09208959937095643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,1,power_law_1.2,0.15238399505615235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,8,power_law_1.2,0.10273920297622681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,1,power_law_1.2,0.158188796043396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,8,power_law_1.2,0.1047935962677002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,1,power_law_1.2,0.17191679477691652
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,8,power_law_1.2,0.10807039737701415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,1,power_law_1.2,0.20590720176696778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,8,power_law_1.2,0.1258944034576416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,1,power_law_1.2,0.23497600555419923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,8,power_law_1.2,0.1416383981704712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,1,power_law_1.2,0.29397759437561033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,8,power_law_1.2,0.15947519540786742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,1,power_law_1.2,0.337990403175354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,8,power_law_1.2,0.2078336000442505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,1,power_law_1.2,0.4358975887298584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,8,power_law_1.2,0.24119040966033936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,1,power_law_1.2,0.5460864067077636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,8,power_law_1.2,0.30714240074157717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,1,power_law_1.2,0.7248832225799561
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,8,power_law_1.2,0.4234367847442627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,1,power_law_1.2,0.9029760360717773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,8,power_law_1.2,0.5350656032562255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,1,power_law_1.2,1.2616448402404785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,8,power_law_1.2,0.8125568389892578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,1,power_law_1.2,1.6189504623413087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,8,power_law_1.2,0.9288960456848144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,1,power_law_1.2,1.9956480026245118
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,8,power_law_1.2,1.3759743690490722
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,1,power_law_1.2,3.135161590576172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,8,power_law_1.2,2.3016384124755858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,1,power_law_1.2,6.208793640136719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,8,power_law_1.2,4.949875259399414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,8,power_law_1.01,0.11253759860992432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,8,power_law_1.01,0.15352959632873536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,8,power_law_1.01,0.08184959888458251
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,8,power_law_1.01,0.09659519791603088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,8,power_law_1.01,0.13018239736557008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,8,power_law_1.01,0.15803519487380982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,8,power_law_1.01,0.16500480175018312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,8,power_law_1.01,0.17279360294342042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,8,power_law_1.01,0.18179839849472046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,8,power_law_1.01,0.18097280263900756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,8,power_law_1.01,0.18343039751052856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,8,power_law_1.01,0.19338879585266114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,8,power_law_1.01,0.19243520498275757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,8,power_law_1.01,0.20636799335479736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,8,power_law_1.01,0.21578879356384278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,8,power_law_1.01,0.2223423957824707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,8,power_law_1.01,0.22391040325164796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,8,power_law_1.01,0.26487040519714355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,8,power_law_1.01,0.2876672029495239
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,8,power_law_1.01,0.33703041076660156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,8,power_law_1.2,0.12213759422302246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,8,power_law_1.01,0.3855616092681885
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,8,power_law_1.2,0.08957440257072449
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,8,power_law_1.01,0.5108992099761963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,8,power_law_1.2,0.08241279721260071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,4,power_law_1.01,0.08677120208740234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,8,power_law_1.01,0.5690559864044189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,8,power_law_1.2,0.10515199899673462
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,4,power_law_1.01,0.0945472002029419
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,8,power_law_1.01,0.729420804977417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,4,power_law_1.01,0.07797120213508606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,8,power_law_1.2,0.11783679723739623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,8,power_law_1.01,0.8903871536254883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,4,power_law_1.01,0.1011072039604187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,8,power_law_1.2,0.165555202960968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,8,power_law_1.01,1.2915967941284179
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,4,power_law_1.01,0.12282240390777588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,8,power_law_1.2,0.16495360136032106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,8,power_law_1.01,1.6142591476440429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,4,power_law_1.01,0.16376960277557373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,8,power_law_1.2,0.17272959947586058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,8,power_law_1.01,1.9899648666381835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,4,power_law_1.01,0.1762879967689514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,8,power_law_1.2,0.17948800325393677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,8,power_law_1.01,3.3852672576904297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,4,power_law_1.01,0.17994879484176635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,8,power_law_1.2,0.18030719757080077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,4,power_law_1.01,0.17975679636001587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,8,power_law_1.2,0.19011199474334717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,8,power_law_1.01,6.823872375488281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,4,power_law_1.01,0.1842560052871704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,8,power_law_1.2,0.1991487979888916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,4,power_law_1.01,0.1901952028274536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,8,power_law_1.2,0.2054975986480713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,4,power_law_1.01,0.20351359844207764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,8,power_law_1.2,0.21103360652923583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,4,power_law_1.01,0.20062720775604248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,8,power_law_1.2,0.2319103956222534
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,4,power_law_1.01,0.2075711965560913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,8,power_law_1.2,0.24337921142578126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,4,power_law_1.01,0.2196671962738037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,8,power_law_1.2,0.2394495964050293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,4,power_law_1.01,0.2223423957824707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,8,power_law_1.2,0.2741055965423584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,4,power_law_1.01,0.23586559295654297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,8,power_law_1.2,0.31629440784454343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,4,power_law_1.01,0.26577279567718504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,8,power_law_1.2,0.3674880027770996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,4,power_law_1.01,0.2891135931015015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,8,power_law_1.2,0.42791042327880857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,4,power_law_1.01,0.35669760704040526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,8,power_law_1.2,0.5284607887268067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,4,power_law_1.01,0.38904318809509275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,8,power_law_1.2,0.6075200080871582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,4,power_law_1.01,0.5047552108764648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,8,power_law_1.2,0.8104703903198243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,4,power_law_1.01,0.541209602355957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,8,power_law_1.2,0.9509696006774903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,4,power_law_1.01,0.7998720169067383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,8,power_law_1.2,1.504319953918457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,2,power_law_1.2,0.065830397605896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,4,power_law_1.01,0.996889591217041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,8,power_law_1.2,1.9501823425292968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,2,power_law_1.2,0.0902079999446869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,4,power_law_1.01,1.3456640243530273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,2,power_law_1.2,0.09347839951515198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,8,power_law_1.2,2.367763137817383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,2,power_law_1.2,0.09918720126152039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,4,power_law_1.01,1.7378623962402344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,8,power_law_1.2,3.8032127380371095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,2,power_law_1.2,0.10003199577331542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,4,power_law_1.01,1.9871040344238282
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,2,power_law_1.2,0.10576640367507935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,8,power_law_1.2,9.244960021972656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,4,power_law_1.01,3.3615169525146484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,2,power_law_1.2,0.11252479553222657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,2,power_law_1.2,0.11806080341339112
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,4,power_law_1.01,6.457612609863281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,2,power_law_1.2,0.12146559953689576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,2,power_law_1.2,0.10944000482559205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,2,power_law_1.2,0.11886080503463745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,4,power_law_1.2,0.0925055980682373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,2,power_law_1.2,0.12172800302505493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,4,power_law_1.2,0.06894720196723939
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,2,power_law_1.2,0.13485440015792846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,4,power_law_1.2,0.07816320061683654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,2,power_law_1.2,0.15164799690246583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,4,power_law_1.2,0.09535999894142151
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,2,power_law_1.2,0.1772480010986328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,4,power_law_1.2,0.10806399583816528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,2,power_law_1.2,0.2093951940536499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,4,power_law_1.2,0.1676800012588501
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,2,power_law_1.2,0.22783360481262208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,4,power_law_1.2,0.17274880409240723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,2,power_law_1.2,0.2970560073852539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,4,power_law_1.2,0.18302079439163207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,2,power_law_1.2,0.38757760524749757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,4,power_law_1.2,0.18526079654693603
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,2,power_law_1.2,0.5145535945892334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,4,power_law_1.2,0.1821951985359192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,4,power_law_1.2,0.19714560508728027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,2,power_law_1.2,0.6119616031646729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,4,power_law_1.2,0.19981440305709838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,2,power_law_1.2,0.906668758392334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,4,power_law_1.2,0.20759038925170897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,2,power_law_1.2,1.1637375831604004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,4,power_law_1.2,0.21250560283660888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,2,power_law_1.2,1.4607104301452636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,4,power_law_1.2,0.22376320362091065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,2,power_law_1.2,2.178726387023926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,4,power_law_1.2,0.2469183921813965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,4,power_law_1.2,0.24751360416412355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,2,power_law_1.2,4.638803100585937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,4,power_law_1.2,0.28460159301757815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,4,power_law_1.2,0.3008960008621216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,4,power_law_1.2,0.36373119354248046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,4,power_law_1.2,0.4298111915588379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,4,power_law_1.2,0.5313920021057129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,4,power_law_1.2,0.5997759819030761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,4,power_law_1.2,0.8097151756286621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,4,power_law_1.2,0.9067135810852051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,4,power_law_1.2,1.433664035797119
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,2,power_law_1.01,0.06888960003852844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,4,power_law_1.2,1.888582420349121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,2,power_law_1.01,0.07545599937438965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,4,power_law_1.2,2.357593536376953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,2,power_law_1.2,0.0666815996170044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,2,power_law_1.01,0.07667199969291687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,4,power_law_1.2,3.4790721893310548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,2,power_law_1.2,0.07427840232849121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,2,power_law_1.01,0.10186879634857178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,2,power_law_1.2,0.07774720191955567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,2,power_law_1.01,0.12459520101547242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,4,power_law_1.2,8.510176086425782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,2,power_law_1.2,0.0976256012916565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,2,power_law_1.01,0.1708799958229065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,2,power_law_1.2,0.12097920179367065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,2,power_law_1.01,0.1786687970161438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,2,power_law_1.2,0.16992000341415406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,2,power_law_1.01,0.18926080465316772
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,2,power_law_1.2,0.18261120319366456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,2,power_law_1.01,0.19259519577026368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,2,power_law_1.2,0.1911936044692993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,2,power_law_1.01,0.19772160053253174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,2,power_law_1.2,0.19366400241851806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,2,power_law_1.01,0.20609281063079835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,2,power_law_1.2,0.20288000106811524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,2,power_law_1.01,0.20815999507904054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,2,power_law_1.2,0.21456639766693114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,2,power_law_1.01,0.211027193069458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,2,power_law_1.2,0.21989119052886963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,2,power_law_1.01,0.21717119216918945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,2,power_law_1.2,0.2313472032546997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,2,power_law_1.01,0.2265984058380127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,2,power_law_1.2,0.2348479986190796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,2,power_law_1.01,0.2405247926712036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,2,power_law_1.2,0.24631040096282958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,2,power_law_1.01,0.2591615915298462
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,2,power_law_1.2,0.24507520198822022
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,2,power_law_1.01,0.28659839630126954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,2,power_law_1.2,0.26371839046478274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,2,power_law_1.01,0.3191551923751831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,2,power_law_1.2,0.2932159900665283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,2,power_law_1.01,0.39178240299224854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,2,power_law_1.2,0.3173759937286377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,2,power_law_1.01,0.44163198471069337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,2,power_law_1.2,0.3837183952331543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,2,power_law_1.01,0.5452672004699707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,2,power_law_1.2,0.44741120338439944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,2,power_law_1.01,0.6401023864746094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,2,power_law_1.2,0.5862080097198487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,2,power_law_1.01,0.876416015625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,2,power_law_1.2,0.7089663982391358
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,2,power_law_1.01,1.0703743934631347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,2,power_law_1.2,0.8928640365600586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,2,power_law_1.01,1.4760512351989745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,2,power_law_1.2,1.063468837738037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,2,power_law_1.01,1.9190784454345704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,2,power_law_1.2,1.6835968017578125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,2,power_law_1.01,2.2770368576049806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,2,power_law_1.2,2.0387199401855467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,1,power_law_1.01,0.06276479959487916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,2,power_law_1.01,3.4851520538330076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,1,power_law_1.01,0.07587199807167053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,2,power_law_1.2,2.523878479003906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,1,power_law_1.01,0.08775039911270141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,2,power_law_1.01,7.291782379150391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,2,power_law_1.2,4.1573631286621096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,1,power_law_1.01,0.11560319662094116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,1,power_law_1.01,0.1381119966506958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,2,power_law_1.2,7.8071037292480465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,1,power_law_1.01,0.20570878982543944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,1,power_law_1.01,0.21267199516296387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,1,power_law_1.01,0.22680320739746093
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,1,power_law_1.01,0.2339776039123535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,1,power_law_1.01,0.24155519008636475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,1,power_law_1.01,0.2487231969833374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,1,power_law_1.01,0.25179519653320315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,1,power_law_1.01,0.256499195098877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,1,power_law_1.01,0.26817920207977297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,1,power_law_1.01,0.28353281021118165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,1,power_law_1.01,0.29745919704437257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,1,power_law_1.2,0.05971199870109558
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,1,power_law_1.01,0.3173248052597046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,1,power_law_1.2,0.06996480226516724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,1,power_law_1.01,0.3683199882507324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,1,power_law_1.2,0.08840320110321045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,1,power_law_1.01,0.420959997177124
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,1,power_law_1.2,0.10478719472885131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,1,power_law_1.01,0.5100351810455322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,1,power_law_1.2,0.12445440292358398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,1,power_law_1.01,0.5745151996612549
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,1,power_law_1.2,0.20307838916778564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,1,power_law_1.01,0.7322432041168213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,1,power_law_1.2,0.21578879356384278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,1,power_law_1.2,0.2297215938568115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,1,power_law_1.01,0.9300800323486328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,1,power_law_1.2,0.23420801162719726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,1,power_law_1.01,1.2063488006591796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,1,power_law_1.2,0.2432255983352661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,1,power_law_1.01,1.4740415573120118
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,1,power_law_1.2,0.24649600982666015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,1,power_law_1.01,2.0390655517578127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,1,power_law_1.2,0.2569472074508667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,1,power_law_1.01,2.579955291748047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,1,power_law_1.2,0.26204800605773926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,1,power_law_1.01,3.1869760513305665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,1,power_law_1.2,0.27886080741882324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,1,power_law_1.2,0.29074559211730955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,1,power_law_1.01,4.897875213623047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,1,power_law_1.2,0.3005759954452515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,8,power_law_1.01,0.1606335997581482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,1,power_law_1.2,0.31799681186676027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,1,power_law_1.01,9.748973083496093
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,8,power_law_1.01,0.1663807988166809
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,8,power_law_1.2,0.16295039653778076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,1,power_law_1.2,0.37265920639038086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,8,power_law_1.01,0.2612031936645508
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,1,power_law_1.2,0.41280641555786135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,8,power_law_1.2,0.16663039922714235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,8,power_law_1.01,0.10288000106811523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,1,power_law_1.2,0.5002560138702392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,8,power_law_1.2,0.14657280445098878
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,8,power_law_1.01,0.1362496018409729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,1,power_law_1.2,0.5690559864044189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,8,power_law_1.2,0.10602240562438965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,1,power_law_1.2,0.7310719966888428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,8,power_law_1.01,0.18478720188140868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,8,power_law_1.2,0.136953604221344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,1,power_law_1.2,0.9477312088012695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,8,power_law_1.01,0.20857601165771483
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,8,power_law_1.2,0.1838528037071228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,1,power_law_1.2,1.2178560256958009
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,8,power_law_1.01,0.2642816066741943
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,8,power_law_1.2,0.2024768114089966
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,1,power_law_1.2,1.4587200164794922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,8,power_law_1.01,0.2683712005615234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,8,power_law_1.2,0.25530879497528075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,1,power_law_1.2,2.0349504470825197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,8,power_law_1.2,0.2743680000305176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,8,power_law_1.01,0.2706239938735962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,1,power_law_1.2,2.6066240310668944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,8,power_law_1.2,0.26207358837127687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,8,power_law_1.01,0.29254400730133057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,1,power_law_1.2,3.2451713562011717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,8,power_law_1.2,0.28808960914611814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,8,power_law_1.01,0.27390079498291015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,1,power_law_1.2,5.005638504028321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,8,power_law_1.2,0.28009600639343263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,8,power_law_1.01,0.3056447982788086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,8,power_law_1.2,0.3067199945449829
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,1,power_law_1.2,9.999078369140625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,8,power_law_1.01,0.32359681129455564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,8,power_law_1.2,0.31305599212646484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,8,power_law_1.01,0.3216063976287842
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,8,power_law_1.2,0.31040000915527344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,8,power_law_1.01,0.33615999221801757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,8,power_law_1.2,0.33068161010742186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,8,power_law_1.01,0.3377664089202881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,8,power_law_1.2,0.3634624004364014
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,8,power_law_1.01,0.37404799461364746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,8,power_law_1.2,0.3874239921569824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,8,power_law_1.01,0.39371519088745116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,8,power_law_1.2,0.3993024110794067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,8,power_law_1.01,0.46497278213500975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,8,power_law_1.2,0.4699456214904785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,8,power_law_1.01,0.5148608207702636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,8,power_law_1.2,0.5514560222625733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,8,power_law_1.01,0.6320896148681641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,8,power_law_1.2,0.6900991916656494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,8,power_law_1.01,0.7183040142059326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,4,power_law_1.01,0.10003839731216431
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,8,power_law_1.2,0.7126207828521729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,8,power_law_1.01,0.9128704071044922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,4,power_law_1.01,0.11600639820098876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,8,power_law_1.2,0.9137408256530761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,8,power_law_1.01,1.07772798538208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,4,power_law_1.01,0.17047040462493895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,8,power_law_1.2,1.1932928085327148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,4,power_law_1.01,0.09758080244064331
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,8,power_law_1.01,1.3636287689208983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,8,power_law_1.2,1.5678720474243164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,4,power_law_1.01,0.13628799915313722
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,8,power_law_1.01,1.7607423782348632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,4,power_law_1.01,0.18523520231246948
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,8,power_law_1.2,2.0235456466674804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,8,power_law_1.01,2.043168067932129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,4,power_law_1.01,0.21470720767974855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,8,power_law_1.2,2.460806465148926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,8,power_law_1.01,3.0982847213745117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,4,power_law_1.01,0.25936639308929443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,8,power_law_1.2,3.871263885498047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,4,power_law_1.01,0.26305279731750486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,8,power_law_1.01,6.057030487060547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,4,power_law_1.01,0.2771903991699219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,8,power_law_1.2,7.761990356445312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,4,power_law_1.01,0.2837376117706299
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,4,power_law_1.01,0.3047616004943848
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,4,power_law_1.01,0.30586240291595457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,4,power_law_1.01,0.31814401149749755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,4,power_law_1.2,0.11419520378112794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,4,power_law_1.01,0.33166720867156985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,4,power_law_1.2,0.11577600240707397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,4,power_law_1.01,0.34128000736236574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,4,power_law_1.2,0.10062079429626465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,4,power_law_1.01,0.3584896087646484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,4,power_law_1.2,0.10273920297622681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,4,power_law_1.01,0.37754240036010744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,4,power_law_1.2,0.13243520259857178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,4,power_law_1.01,0.40232319831848146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,4,power_law_1.2,0.16766079664230346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,4,power_law_1.01,0.46825599670410156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,4,power_law_1.2,0.19448959827423096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,4,power_law_1.01,0.5243840217590332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,4,power_law_1.2,0.2420032024383545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,4,power_law_1.01,0.6552512168884277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,4,power_law_1.2,0.26001920700073244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,4,power_law_1.01,0.7592832088470459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,4,power_law_1.2,0.26903040409088136
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,4,power_law_1.2,0.27968640327453614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,4,power_law_1.01,0.9694016456604004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,4,power_law_1.2,0.2944447994232178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,4,power_law_1.01,1.1617216110229491
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,4,power_law_1.2,0.2995392084121704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,4,power_law_1.01,1.4994175910949707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,4,power_law_1.2,0.31491200923919677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,4,power_law_1.01,1.9129087448120117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,4,power_law_1.2,0.3310719966888428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,4,power_law_1.01,2.376383972167969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,4,power_law_1.2,0.3431616067886353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,4,power_law_1.01,3.713926315307617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,4,power_law_1.2,0.36037120819091795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,4,power_law_1.2,0.40538878440856935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,4,power_law_1.01,7.077970886230469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,4,power_law_1.2,0.43267202377319336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,4,power_law_1.2,0.4879615783691406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,4,power_law_1.2,0.5596223831176758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,4,power_law_1.2,0.6938111782073975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,4,power_law_1.2,0.8173695564270019
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,4,power_law_1.2,1.0423680305480958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,2,power_law_1.01,0.07094399929046631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,4,power_law_1.2,1.182643222808838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,2,power_law_1.01,0.09223679900169372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,2,power_law_1.2,0.06956160068511963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,4,power_law_1.2,1.7370367050170898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,2,power_law_1.01,0.12460160255432129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,2,power_law_1.2,0.09251199960708618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,2,power_law_1.2,0.08881279826164246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,2,power_law_1.01,0.10944639444351197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,4,power_law_1.2,1.9166400909423829
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,2,power_law_1.2,0.10848000049591064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,2,power_law_1.01,0.14876799583435057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,4,power_law_1.2,2.6557823181152345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,2,power_law_1.01,0.20325119495391847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,2,power_law_1.2,0.13797119855880738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,4,power_law_1.2,4.001318359375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,2,power_law_1.01,0.22985599040985108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,2,power_law_1.2,0.18056319952011107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,2,power_law_1.2,0.19714560508728027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,2,power_law_1.01,0.28065919876098633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,4,power_law_1.2,8.644338989257813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,2,power_law_1.2,0.2702719926834106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,2,power_law_1.01,0.29171841144561766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,2,power_law_1.2,0.2788671970367432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,2,power_law_1.01,0.2933504104614258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,2,power_law_1.2,0.285427188873291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,2,power_law_1.01,0.31251840591430663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,2,power_law_1.2,0.3120448112487793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,2,power_law_1.01,0.3273216009140015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,2,power_law_1.2,0.32883200645446775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,2,power_law_1.01,0.32981760501861573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,2,power_law_1.2,0.3398911952972412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,2,power_law_1.01,0.36463360786437987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,2,power_law_1.2,0.373471999168396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,2,power_law_1.01,0.38755838871002196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,2,power_law_1.2,0.38679039478302
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,2,power_law_1.01,0.4080512046813965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,2,power_law_1.2,0.40440959930419923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,2,power_law_1.01,0.3939007997512817
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,2,power_law_1.2,0.3947839975357056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,2,power_law_1.01,0.42729601860046384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,2,power_law_1.2,0.4457791805267334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,2,power_law_1.01,0.45842561721801756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,2,power_law_1.2,0.4810175895690918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,2,power_law_1.01,0.5460095882415772
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,2,power_law_1.2,0.5600575923919677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,2,power_law_1.01,0.6071040153503418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,2,power_law_1.2,0.6268223762512207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,2,power_law_1.01,0.7285632133483887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,2,power_law_1.2,0.7740608215332031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,2,power_law_1.01,0.8870656013488769
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,2,power_law_1.2,0.924403190612793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,2,power_law_1.01,1.135904026031494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,2,power_law_1.2,1.1896127700805663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,2,power_law_1.01,1.3353792190551759
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,2,power_law_1.2,1.427577590942383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,2,power_law_1.01,1.8213695526123046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,2,power_law_1.2,1.8824575424194336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,2,power_law_1.01,2.300320053100586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,2,power_law_1.2,2.377248001098633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,2,power_law_1.01,2.695852851867676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,2,power_law_1.2,2.83702392578125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,2,power_law_1.01,4.263808059692383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,2,power_law_1.2,4.5708671569824215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,2,power_law_1.01,7.802137756347657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,2,power_law_1.2,8.764749145507812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,1,power_law_1.01,0.07340800166130065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,1,power_law_1.01,0.07955840229988098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,1,power_law_1.01,0.1059008002281189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,1,power_law_1.01,0.1225600004196167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,1,power_law_1.01,0.1856384038925171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,1,8,power_law_1.01,0.03326080143451691
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,1,power_law_1.01,0.2409343957901001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,1,8,power_law_1.01,0.032652801275253295
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,1,8,power_law_1.2,0.03454079926013946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,1,power_law_1.01,0.2732928037643433
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,1,8,power_law_1.01,0.03244799971580505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,1,8,power_law_1.2,0.03495039939880371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,1,8,power_law_1.01,0.03346560001373291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,1,power_law_1.01,0.35317120552062986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,1,8,power_law_1.2,0.034745600819587705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,1,8,power_law_1.01,0.03633280098438263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,1,power_law_1.01,0.37241599559783933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,1,8,power_law_1.2,0.03392640054225922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,1,8,power_law_1.01,0.043910399079322815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,1,8,power_law_1.2,0.03678719997406006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,1,power_law_1.01,0.3773184061050415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,1,8,power_law_1.01,0.0414463996887207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,1,8,power_law_1.2,0.04539520144462585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,1,8,power_law_1.01,0.04677119851112366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,1,power_law_1.01,0.40845441818237305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,1,8,power_law_1.2,0.04294399917125702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,1,8,power_law_1.01,0.04267520010471344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,1,8,power_law_1.2,0.04784640073776245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,1,power_law_1.01,0.42279682159423826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,1,8,power_law_1.01,0.0455487996339798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,1,8,power_law_1.2,0.043347200751304625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,1,8,power_law_1.01,0.05251839756965637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,1,power_law_1.01,0.42646398544311526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,1,8,power_law_1.2,0.04785920083522797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,1,8,power_law_1.01,0.06356480121612548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,1,power_law_1.2,0.06853119730949402
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,1,power_law_1.01,0.48136320114135744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,1,8,power_law_1.2,0.05317760109901428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,1,8,power_law_1.01,0.06930559873580933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,1,8,power_law_1.2,0.06320639848709106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,1,power_law_1.2,0.07816320061683654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,1,power_law_1.01,0.5259967803955078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,1,8,power_law_1.01,0.07973759770393371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,1,8,power_law_1.2,0.07017599940299987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,1,power_law_1.2,0.09270399808883667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,1,8,power_law_1.01,0.08077440261840821
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,1,power_law_1.01,0.5583615779876709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,1,8,power_law_1.2,0.0818560004234314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,1,8,power_law_1.01,0.09450240135192871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,1,power_law_1.2,0.1232192039489746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,1,8,power_law_1.2,0.09823359847068787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,1,power_law_1.01,0.49120640754699707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,1,8,power_law_1.01,0.1356608033180237
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,1,8,power_law_1.2,0.10353280305862426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,1,power_law_1.2,0.16745599508285522
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,1,power_law_1.01,0.5645055770874023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,1,8,power_law_1.01,0.1774399995803833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,1,8,power_law_1.2,0.13448959589004517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,1,power_law_1.2,0.21742720603942872
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,1,8,power_law_1.01,0.22371840476989746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,1,8,power_law_1.2,0.18568960428237916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,1,power_law_1.01,0.6153024196624756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,1,8,power_law_1.01,0.3631808042526245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,1,8,power_law_1.2,0.2628864049911499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,1,power_law_1.2,0.2471168041229248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,1,power_law_1.01,0.7297855854034424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,1,8,power_law_1.01,0.4332287788391113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,1,8,power_law_1.2,0.3845376014709473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,1,power_law_1.2,0.3537856101989746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,1,power_law_1.01,0.8227775573730469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,1,8,power_law_1.01,0.7056191921234131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,1,8,power_law_1.2,0.4772928237915039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,1,8,power_law_1.2,0.7073023796081543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,1,8,power_law_1.01,0.908358383178711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,1,power_law_1.2,0.36693758964538575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,1,power_law_1.01,1.0111743927001953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,1,8,power_law_1.2,0.8736063957214355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,1,8,power_law_1.01,1.3378368377685548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,1,power_law_1.2,0.38085761070251467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,1,power_law_1.01,1.2149503707885743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,1,8,power_law_1.2,1.4030207633972167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,1,8,power_law_1.01,1.505568027496338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,1,power_law_1.2,0.4009280204772949
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,1,power_law_1.01,1.5780672073364257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,1,8,power_law_1.2,1.7599807739257813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,1,8,power_law_1.01,2.499263954162598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,1,8,power_law_1.2,2.4829248428344726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,1,8,power_law_1.01,3.6217727661132812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,1,power_law_1.2,0.4388095855712891
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,1,power_law_1.01,1.963315200805664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,1,8,power_law_1.2,3.5347713470458983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,1,8,power_law_1.01,4.462259292602539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,1,power_law_1.2,0.45068159103393557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,1,power_law_1.01,2.6004287719726564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,1,8,power_law_1.2,4.536038589477539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,1,8,power_law_1.01,7.2155906677246096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,1,power_law_1.2,0.4429056167602539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,1,power_law_1.01,3.1734527587890624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,1,8,power_law_1.2,7.143756866455078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,1,power_law_1.2,0.45642881393432616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,1,8,power_law_1.01,13.856434631347657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,1,power_law_1.01,3.8437694549560546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,1,power_law_1.2,0.48100481033325193
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,1,8,power_law_1.2,14.541349792480469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,1,power_law_1.2,0.5567679882049561
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,1,power_law_1.01,5.863711929321289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,1,power_law_1.2,0.6486720085144043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,1,8,power_law_1.01,0.06233599781990051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,1,power_law_1.2,0.639296007156372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,1,power_law_1.01,11.213299560546876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,1,8,power_law_1.01,0.06254079937934875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,1,8,power_law_1.2,0.06056320071220398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,1,power_law_1.2,0.7519487857818603
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,1,8,power_law_1.01,0.06152960062026978
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,1,8,power_law_1.2,0.06466559767723083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,1,power_law_1.2,0.8232128143310546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,1,8,power_law_1.01,0.05864959955215454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,1,8,power_law_1.2,0.060153597593307497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,1,8,power_law_1.01,0.05864959955215454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,1,8,power_law_1.2,0.0605567991733551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,1,power_law_1.2,1.013702392578125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,1,8,power_law_1.01,0.058246397972106935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,1,8,power_law_1.2,0.05912960171699524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,1,power_law_1.2,1.2518783569335938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,1,8,power_law_1.01,0.05927039980888367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,1,8,power_law_1.2,0.060147202014923094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,1,8,power_law_1.01,0.0602944016456604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,1,8,power_law_1.2,0.061587202548980716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,1,power_law_1.2,1.594495964050293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,2,4,power_law_1.01,0.028358399868011475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,1,8,power_law_1.01,0.06316159963607788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,1,8,power_law_1.2,0.061587202548980716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,2,4,power_law_1.01,0.030195200443267824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,1,power_law_1.2,1.9809600830078125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,1,8,power_law_1.01,0.0670527994632721
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,1,8,power_law_1.2,0.0630016028881073
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,2,4,power_law_1.01,0.028352001309394838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,1,8,power_law_1.01,0.06643840074539184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,1,8,power_law_1.2,0.06627200245857238
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,1,power_law_1.2,2.6471744537353517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,2,4,power_law_1.01,0.030406400561332703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,1,8,power_law_1.2,0.06711680293083191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,1,8,power_law_1.01,0.07463679909706115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,2,4,power_law_1.01,0.030822399258613586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,1,8,power_law_1.2,0.06955519914627076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,1,power_law_1.2,3.182905578613281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,2,4,power_law_1.01,0.03961600065231323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,1,8,power_law_1.2,0.07304319739341736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,2,4,power_law_1.01,0.03592959940433502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,1,power_law_1.2,3.8790462493896483
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,1,8,power_law_1.2,0.07651839852333069
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,2,4,power_law_1.01,0.04126079976558685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,1,8,power_law_1.2,0.09864320158958435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,2,4,power_law_1.01,0.03818880021572113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,1,power_law_1.2,5.909222412109375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,1,8,power_law_1.2,0.10479999780654907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,2,4,power_law_1.01,0.040428799390792844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,1,8,power_law_1.2,0.10970879793167114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,2,4,power_law_1.01,0.0463808000087738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,1,8,power_law_1.2,0.15045759677886963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,1,power_law_1.2,11.225228881835937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,2,4,power_law_1.01,0.05208960175514221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,1,8,power_law_1.2,0.1395840048789978
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,2,4,power_law_1.01,0.05989120006561279
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,1,8,power_law_1.2,0.19286400079727173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,2,4,power_law_1.01,0.06151679754257202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,1,8,power_law_1.2,0.21660161018371582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,2,4,power_law_1.01,0.07811200022697448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,1,8,power_law_1.2,0.31797759532928466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,2,4,power_law_1.01,0.09100800156593322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,1,8,power_law_1.2,0.4066688060760498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,2,4,power_law_1.01,0.10577280521392822
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,2,4,power_law_1.01,0.12008960247039795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,1,8,power_law_1.2,0.6210944175720214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,2,4,power_law_1.01,0.17151360511779784
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,1,8,power_law_1.2,0.783897590637207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,2,4,power_law_1.2,0.030444800853729248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,2,4,power_law_1.01,0.2286463975906372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,1,8,power_law_1.2,1.076972770690918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,2,4,power_law_1.2,0.026956799626350402
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,2,4,power_law_1.01,0.29909119606018064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,1,8,power_law_1.2,1.614156723022461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,2,4,power_law_1.2,0.028403198719024657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,2,4,power_law_1.01,0.45389437675476074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,1,8,power_law_1.2,2.038297653198242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,2,4,power_law_1.2,0.030643200874328612
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,2,4,power_law_1.01,0.6247231960296631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,1,8,power_law_1.2,3.2820545196533204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,2,4,power_law_1.2,0.031462401151657104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,2,4,power_law_1.01,0.8092479705810547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,2,4,power_law_1.2,0.044563201069831845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,2,4,power_law_1.01,1.3316864013671874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,1,8,power_law_1.2,6.922783660888672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,2,4,power_law_1.2,0.03535360097885132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,2,4,power_law_1.01,1.7398527145385743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,2,4,power_law_1.2,0.03903360068798065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,2,4,power_law_1.01,2.8103359222412108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,2,4,power_law_1.2,0.04191359877586365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,2,4,power_law_1.01,2.902899169921875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,2,4,power_law_1.2,0.03761920034885406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,2,4,power_law_1.2,0.05132160186767578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,2,4,power_law_1.01,5.754342269897461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,2,4,power_law_1.01,0.05400320291519165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,2,4,power_law_1.2,0.051532799005508424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,2,4,power_law_1.01,0.04991360008716583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,2,4,power_law_1.01,10.542368316650391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,2,4,power_law_1.2,0.055225598812103274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,2,4,power_law_1.01,0.051558399200439455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,2,4,power_law_1.2,0.07407360076904297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,2,4,power_law_1.01,0.05420799851417542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,2,4,power_law_1.2,0.07119359970092773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,2,4,power_law_1.01,0.05482239723205566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,2,4,power_law_1.2,0.08737919926643371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,2,4,power_law_1.01,0.05503360033035278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,2,4,power_law_1.2,0.10314240455627441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,2,4,power_law_1.01,0.055641597509384154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,2,4,power_law_1.2,0.053324800729751584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,2,4,power_law_1.2,0.13835519552230835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,2,4,power_law_1.01,0.05380480289459229
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,2,4,power_law_1.2,0.051910400390625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,2,4,power_law_1.2,0.1686911940574646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,2,4,power_law_1.01,0.0546239972114563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,2,4,power_law_1.2,0.053337597846984865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,2,4,power_law_1.2,0.2493824005126953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,2,4,power_law_1.01,0.06033920049667359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,2,4,power_law_1.2,0.053337597846984865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,2,4,power_law_1.2,0.373471999168396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,2,4,power_law_1.01,0.060147202014923094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,2,4,power_law_1.2,0.053548800945281985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,2,4,power_law_1.2,0.6042880058288574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,2,4,power_law_1.01,0.06444799900054932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,2,4,power_law_1.2,0.05414400100708008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,2,4,power_law_1.2,0.6169536113739014
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,2,4,power_law_1.01,0.06729599833488464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,2,4,power_law_1.2,0.05496320128440857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,2,4,power_law_1.2,0.9792448043823242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,2,4,power_law_1.01,0.06752640008926392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,2,4,power_law_1.2,0.056620800495147706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,2,4,power_law_1.2,1.0806528091430665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,2,4,power_law_1.2,0.0603007972240448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,2,4,power_law_1.01,0.08021119832992554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,2,4,power_law_1.2,2.3571712493896486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,2,4,power_law_1.2,0.06112639904022217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,2,4,power_law_1.01,0.08225280046463013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,2,4,power_law_1.2,2.892736053466797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,2,4,power_law_1.2,0.06235520243644714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,2,4,power_law_1.01,0.09617919921875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,2,4,power_law_1.2,0.0656063973903656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,2,4,power_law_1.01,0.11052160263061524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,2,4,power_law_1.2,3.845043182373047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,2,4,power_law_1.2,0.06746879816055298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,2,4,power_law_1.01,0.12238719463348388
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,2,4,power_law_1.2,5.663667297363281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,2,4,power_law_1.2,0.0748416006565094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,2,4,power_law_1.01,0.1592576026916504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,2,4,power_law_1.2,0.08856959939002991
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,2,4,power_law_1.01,0.16459519863128663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,2,4,power_law_1.2,9.794898986816406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,2,4,power_law_1.2,0.08734080195426941
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,2,4,power_law_1.01,0.2462847948074341
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,2,4,power_law_1.2,0.09571840167045594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,2,4,power_law_1.01,0.31921279430389404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,2,4,power_law_1.2,0.11148799657821655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,2,4,power_law_1.01,0.42099838256835936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,2,4,power_law_1.2,0.12912000417709352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,2,4,power_law_1.01,0.4978047847747803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,4,2,power_law_1.01,0.02101760059595108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,2,4,power_law_1.2,0.19177600145339965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,2,4,power_law_1.01,0.9256256103515625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,4,2,power_law_1.01,0.02102400064468384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,2,4,power_law_1.2,0.19916160106658937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,2,4,power_law_1.01,1.1605440139770509
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,4,2,power_law_1.01,0.02245119959115982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,2,4,power_law_1.2,0.2753472089767456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,2,4,power_law_1.01,1.2596223831176758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,4,2,power_law_1.01,0.021631999313831328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,2,4,power_law_1.2,0.3273600101470947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,2,4,power_law_1.01,1.7603904724121093
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,4,2,power_law_1.01,0.02778240144252777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,2,4,power_law_1.2,0.47112321853637695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,4,2,power_law_1.01,0.031455999612808226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,2,4,power_law_1.2,0.6347455978393555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,2,4,power_law_1.01,4.776486587524414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,4,2,power_law_1.01,0.030643200874328612
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,2,4,power_law_1.2,0.8792896270751953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,4,2,power_law_1.01,0.032691198587417605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,2,4,power_law_1.2,1.2235584259033203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,4,2,power_law_1.01,0.03454079926013946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,2,4,power_law_1.2,1.5338239669799805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,4,2,power_law_1.01,0.03351039886474609
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,2,4,power_law_1.2,2.9815616607666016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,4,2,power_law_1.2,0.020819200575351714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,4,2,power_law_1.01,0.03697920143604279
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,4,2,power_law_1.2,0.021216000616550445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,4,2,power_law_1.01,0.04416640102863312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,2,4,power_law_1.2,6.532978820800781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,4,2,power_law_1.2,0.02102400064468384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,4,2,power_law_1.01,0.04622080028057098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,4,2,power_law_1.01,0.05130879878997803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,4,2,power_law_1.2,0.02083200067281723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,4,2,power_law_1.01,0.05848960280418396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,4,2,power_law_1.2,0.027161601185798644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,4,2,power_law_1.01,0.070169597864151
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,4,2,power_law_1.2,0.03187839984893799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,4,2,power_law_1.01,0.07734400033950806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,4,2,power_law_1.2,0.03188480138778686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,4,2,power_law_1.01,0.043507200479507444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,4,2,power_law_1.01,0.10437120199203491
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,4,2,power_law_1.2,0.032691198587417605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,4,2,power_law_1.01,0.045151999592781066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,4,2,power_law_1.01,0.13305599689483644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,4,2,power_law_1.2,0.03372159898281098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,4,2,power_law_1.01,0.044947201013565065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,4,2,power_law_1.01,0.18240640163421631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,4,2,power_law_1.2,0.03413119912147522
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,4,2,power_law_1.01,0.05211520195007324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,4,2,power_law_1.2,0.0355648010969162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,4,2,power_law_1.01,0.23135359287261964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,4,2,power_law_1.01,0.052108800411224364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,4,2,power_law_1.2,0.049491199851036075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,4,2,power_law_1.01,0.3575103998184204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,4,2,power_law_1.01,0.0506816029548645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,4,2,power_law_1.2,0.05051519870758057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,4,2,power_law_1.01,0.05129600167274475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,4,2,power_law_1.2,0.05011199712753296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,4,2,power_law_1.01,0.05251839756965637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,4,2,power_law_1.2,0.060550397634506224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,4,2,power_law_1.2,0.06915199756622314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,4,2,power_law_1.2,0.0810368001461029
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,4,2,power_law_1.2,0.11012480258941651
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,4,2,power_law_1.2,0.13877760171890258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,4,2,power_law_1.2,0.2014591932296753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,4,2,power_law_1.2,0.25961599349975584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,4,2,power_law_1.2,0.38188800811767576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,4,2,power_law_1.2,0.4982143878936768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,4,2,power_law_1.2,0.7376255989074707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,4,2,power_law_1.2,0.9760128021240234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,4,2,power_law_1.2,1.4640512466430664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,4,2,power_law_1.2,1.9285312652587892
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,4,2,power_law_1.2,2.4144704818725584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,4,2,power_law_1.2,3.83111686706543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,4,2,power_law_1.2,7.66723861694336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,4,2,power_law_1.2,0.043347200751304625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,4,2,power_law_1.2,0.042956799268722534
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,4,2,power_law_1.2,0.045817598700523376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,4,2,power_law_1.2,0.05175039768218994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,4,2,power_law_1.2,0.05196160078048706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,4,2,power_law_1.2,0.05114240050315857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,4,2,power_law_1.2,0.05196160078048706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,4,2,power_law_1.2,0.051545602083206174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,4,2,power_law_1.2,0.05605760216712952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,4,2,power_law_1.2,0.05973759889602661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,4,2,power_law_1.2,0.05849599838256836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,4,2,power_law_1.2,0.06403840184211732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,4,2,power_law_1.2,0.067084801197052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,4,2,power_law_1.2,0.06997759938240052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,4,2,power_law_1.2,0.07652480006217957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,4,2,power_law_1.2,0.0830784022808075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,4,2,power_law_1.2,0.09062399864196777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,4,2,power_law_1.2,0.10068479776382447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,4,2,power_law_1.2,0.11094399690628051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,4,2,power_law_1.2,0.14328960180282593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,4,2,power_law_1.2,0.1654080033302307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,4,2,power_law_1.2,0.20964479446411133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,4,2,power_law_1.2,0.25102720260620115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,4,2,power_law_1.2,0.3787519931793213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,4,2,power_law_1.2,0.4457791805267334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,4,2,power_law_1.2,0.6643072128295898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,4,2,power_law_1.2,0.8818047523498536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,4,2,power_law_1.2,1.0530176162719727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,4,2,power_law_1.2,1.8328960418701172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,4,2,power_law_1.2,3.877004623413086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,8,1,power_law_1.01,0.01959040015935898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,8,1,power_law_1.01,0.020000000298023225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,8,1,power_law_1.01,0.02409600019454956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,8,1,power_law_1.01,0.03127039968967438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,8,1,power_law_1.01,0.03308799862861633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,8,1,power_law_1.01,0.04163840115070343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,8,1,power_law_1.01,0.0412992000579834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,8,1,power_law_1.01,0.04328320026397705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,8,1,power_law_1.01,0.04170880019664765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,8,1,power_law_1.01,0.04581120014190674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,1,8,power_law_1.01,0.07341439723968506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,8,1,power_law_1.01,0.04785279929637909
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,1,8,power_law_1.01,0.07729920148849487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,8,1,power_law_1.01,0.051551997661590576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,1,8,power_law_1.01,0.09591680169105529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,8,1,power_law_1.01,0.05358719825744629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,1,8,power_law_1.01,0.09468160271644592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,8,1,power_law_1.01,0.05195519924163818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,1,8,power_law_1.01,0.11436799764633179
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,8,1,power_law_1.01,0.054816001653671266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,8,1,power_law_1.01,0.05544959902763367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,1,8,power_law_1.01,0.1364799976348877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,8,1,power_law_1.01,0.06791679859161377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,1,8,power_law_1.01,0.1377087950706482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,8,1,power_law_1.01,0.08022400140762329
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,1,8,power_law_1.01,0.17128959894180298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,8,1,power_law_1.01,0.0949504017829895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,1,8,power_law_1.01,0.21879680156707765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,8,1,power_law_1.01,0.12833280563354493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,1,8,power_law_1.01,0.3224447965621948
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,8,1,power_law_1.01,0.1590656042098999
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,1,8,power_law_1.01,0.393503999710083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,8,1,power_law_1.01,0.22213759422302246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,1,8,power_law_1.01,0.5636928081512451
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,8,1,power_law_1.01,0.28584320545196534
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,1,8,power_law_1.01,0.7457664012908936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,8,1,power_law_1.01,0.4111616134643555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,1,8,power_law_1.01,1.1494208335876466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,8,1,power_law_1.01,0.5350783824920654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,1,8,power_law_1.01,1.5731391906738281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,8,1,power_law_1.01,0.790444803237915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,1,8,power_law_1.01,1.8842239379882812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,8,1,power_law_1.01,1.0415424346923827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,1,8,power_law_1.01,3.018828773498535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,8,1,power_law_1.01,1.3026304244995117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,1,8,power_law_1.01,6.867635345458984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,8,1,power_law_1.01,2.0538368225097656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,8,1,power_law_1.01,4.068479919433594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,8,1,power_law_1.2,0.019340799748897554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,8,1,power_law_1.2,0.01932799965143204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,8,1,power_law_1.2,0.018713599443435668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,8,1,power_law_1.01,0.0398719996213913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,8,1,power_law_1.2,0.01912959963083267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,8,1,power_law_1.01,0.042131200432777405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,8,1,power_law_1.2,0.021158400177955627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,8,1,power_law_1.01,0.04805760085582733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,8,1,power_law_1.2,0.02999039888381958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,8,1,power_law_1.01,0.05235840082168579
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,8,1,power_law_1.2,0.029574400186538695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,8,1,power_law_1.01,0.055027198791503903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,8,1,power_law_1.2,0.03160960078239441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,8,1,power_law_1.01,0.05482239723205566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,8,1,power_law_1.2,0.03243519961833954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,8,1,power_law_1.01,0.056467199325561525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,8,1,power_law_1.2,0.03304960131645203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,8,1,power_law_1.01,0.05605120062828064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,8,1,power_law_1.2,0.03429119884967804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,8,1,power_law_1.01,0.05687680244445801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,8,1,power_law_1.2,0.0385919988155365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,8,1,power_law_1.01,0.05727999806404114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,8,1,power_law_1.2,0.03878400027751923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,8,1,power_law_1.01,0.0581055998802185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,8,1,power_law_1.2,0.039001598954200745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,8,1,power_law_1.01,0.061382400989532473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,8,1,power_law_1.2,0.041043201088905336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,8,1,power_law_1.01,0.06546559929847717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,8,1,power_law_1.2,0.04924800097942352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,8,1,power_law_1.01,0.0654591977596283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,8,1,power_law_1.2,0.05251200199127197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,8,1,power_law_1.01,0.0750976026058197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,8,1,power_law_1.2,0.07052800059318542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,8,1,power_law_1.01,0.07857279777526856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,8,1,power_law_1.2,0.08321920037269592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,8,1,power_law_1.01,0.0834879994392395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,8,1,power_law_1.2,0.11743359565734864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,8,1,power_law_1.01,0.09741439819335937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,8,1,power_law_1.2,0.15450880527496338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,8,1,power_law_1.01,0.10888960361480712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,8,1,power_law_1.2,0.22371840476989746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,8,1,power_law_1.01,0.1330623984336853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,8,1,power_law_1.2,0.27368319034576416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,8,1,power_law_1.01,0.15619200468063354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,8,1,power_law_1.2,0.3990335941314697
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,8,1,power_law_1.01,0.1985856056213379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,8,1,power_law_1.2,0.5235455989837646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,8,1,power_law_1.01,0.23892478942871093
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,8,1,power_law_1.2,0.7760640144348144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,8,1,power_law_1.01,0.32884480953216555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,8,1,power_law_1.2,1.0259200096130372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,8,1,power_law_1.01,0.41280641555786135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,8,1,power_law_1.2,1.2849984169006348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,8,1,power_law_1.01,0.5858687877655029
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,8,1,power_law_1.2,2.0464384078979494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,8,1,power_law_1.01,0.7568704128265381
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,8,1,power_law_1.2,4.064326477050781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,8,1,power_law_1.01,0.9321855545043946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,8,1,power_law_1.01,1.4632320404052734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,8,1,power_law_1.01,3.0037376403808596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,8,1,power_law_1.2,0.04042240083217621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,8,1,power_law_1.2,0.04287999868392944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,1,8,power_law_1.01,0.012627199292182922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,8,1,power_law_1.2,0.04575999975204468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,1,8,power_law_1.01,0.012831999361515046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,8,1,power_law_1.2,0.05374720096588135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,1,8,power_law_1.01,0.012217599898576736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,8,1,power_law_1.2,0.0525056004524231
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,1,8,power_law_1.01,0.014393599331378936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,8,1,power_law_1.2,0.052716797590255736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,1,8,power_law_1.01,0.013862399756908417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,8,1,power_law_1.2,0.05374079942703247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,1,8,power_law_1.01,0.016518400609493257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,8,1,power_law_1.2,0.05639680027961731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,1,8,power_law_1.01,0.014886400103569031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,8,1,power_law_1.2,0.054553598165512085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,1,8,power_law_1.01,0.017113600671291352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,8,1,power_law_1.2,0.055174398422241214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,1,8,power_law_1.01,0.014739200472831726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,8,1,power_law_1.2,0.0586624026298523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,1,8,power_law_1.01,0.014681600034236908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,8,1,power_law_1.2,0.061926400661468504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,1,8,power_law_1.01,0.01775359958410263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,8,1,power_law_1.2,0.06500480175018311
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,1,8,power_law_1.01,0.015296000242233276
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,1,8,power_law_1.01,0.01530880033969879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,8,1,power_law_1.2,0.06746240258216858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,1,8,power_law_1.01,0.016729600727558136
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,8,1,power_law_1.2,0.07790719866752624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,1,8,power_law_1.01,0.017958399653434754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,8,1,power_law_1.2,0.08119040131568908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,1,8,power_law_1.01,0.018777599930763243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,8,1,power_law_1.2,0.08610560297966004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,1,8,power_law_1.01,0.02205439954996109
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,8,1,power_law_1.2,0.09797120094299316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,1,8,power_law_1.01,0.025331199169158936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,8,1,power_law_1.2,0.10862720012664795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,4,2,power_law_1.01,0.4728064060211182
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,1,8,power_law_1.01,0.02963840067386627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,8,1,power_law_1.2,0.13217920064926147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,4,2,power_law_1.01,0.6325568199157715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,1,8,power_law_1.01,0.038649600744247434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,8,1,power_law_1.2,0.1530751943588257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,4,2,power_law_1.01,0.8936832427978516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,1,8,power_law_1.01,0.04539520144462585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,8,1,power_law_1.2,0.1950271964073181
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,4,2,power_law_1.01,1.2952511787414551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,1,8,power_law_1.01,0.06053760051727295
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,8,1,power_law_1.2,0.23437440395355225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,4,2,power_law_1.01,1.7898431777954102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,1,8,power_law_1.01,0.07508479952812194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,8,1,power_law_1.2,0.3208064079284668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,4,2,power_law_1.01,2.24389762878418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,1,8,power_law_1.01,0.1084671974182129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,8,1,power_law_1.2,0.4064064025878906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,4,2,power_law_1.01,3.708256149291992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,1,8,power_law_1.01,0.14083839654922486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,8,1,power_law_1.2,0.5796671867370605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,1,8,power_law_1.01,0.20289919376373292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,4,2,power_law_1.01,6.900870513916016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,8,1,power_law_1.2,0.7506688117980957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,1,8,power_law_1.01,0.26370561122894287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,8,1,power_law_1.2,0.9243391990661621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,1,8,power_law_1.01,0.3249408006668091
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,8,1,power_law_1.2,1.466438388824463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,1,8,power_law_1.01,0.5100800037384033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,8,1,power_law_1.2,2.928716850280762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,1,8,power_law_1.2,0.012620800733566284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,1,8,power_law_1.01,0.9973055839538574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,1,8,power_law_1.2,0.012812800705432892
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,1,8,power_law_1.2,0.013030399382114411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,1,8,power_law_1.2,0.012825599312782288
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,1,8,power_law_1.2,0.01340160071849823
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,1,8,power_law_1.2,0.01671680063009262
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,1,8,power_law_1.2,0.014745600521564484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,1,8,power_law_1.01,0.07751039862632751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,1,8,power_law_1.2,0.0763264000415802
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,1,8,power_law_1.2,0.016927999258041383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,1,8,power_law_1.2,0.07939199805259704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,1,8,power_law_1.01,0.0815936028957367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,1,8,power_law_1.2,0.015078400075435639
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,1,8,power_law_1.2,0.0779583990573883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,1,8,power_law_1.01,0.0785215973854065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,1,8,power_law_1.2,0.015193599462509155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,1,8,power_law_1.2,0.07714560031890869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,1,8,power_law_1.01,0.07872639894485474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,1,8,power_law_1.2,0.01754239946603775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,1,8,power_law_1.2,0.07775359749794006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,1,8,power_law_1.01,0.07893760204315185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,1,8,power_law_1.2,0.015667200088500977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,1,8,power_law_1.2,0.07899519801139832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,1,8,power_law_1.01,0.07893120050430298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,1,8,power_law_1.2,0.01568640023469925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,1,8,power_law_1.2,0.07941120266914367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,1,8,power_law_1.2,0.01774719953536987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,1,8,power_law_1.2,0.07980800271034241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,1,8,power_law_1.2,0.01958400011062622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,1,8,power_law_1.2,0.0818560004234314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,1,8,power_law_1.2,0.021222400665283202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,1,8,power_law_1.2,0.02122880071401596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,1,8,power_law_1.2,0.025119999051094057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,1,8,power_law_1.2,0.029836800694465638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,1,8,power_law_1.2,0.038431999087333676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,1,8,power_law_1.2,0.04580479860305786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,1,8,power_law_1.2,0.060063999891281125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,1,8,power_law_1.2,0.07529600262641907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,1,8,power_law_1.2,0.1084671974182129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,1,8,power_law_1.2,0.1410431981086731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,1,8,power_law_1.2,0.20227839946746826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,1,8,power_law_1.2,0.262662410736084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,1,8,power_law_1.2,0.32351999282836913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,1,8,power_law_1.2,0.507212781906128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,1,8,power_law_1.2,0.9928000450134278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,2,4,power_law_1.01,0.031033599376678468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,2,4,power_law_1.01,0.0255295991897583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,2,4,power_law_1.01,0.031052801012992858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,2,4,power_law_1.01,0.025113600492477416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,2,4,power_law_1.01,0.03187200129032135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,2,4,power_law_1.01,0.05112959742546082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,2,4,power_law_1.01,0.040057599544525146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,2,4,power_law_1.01,0.050310397148132326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,2,4,power_law_1.01,0.04655359983444214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,2,4,power_law_1.01,0.0470335990190506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,2,4,power_law_1.01,0.05763840079307556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,2,4,power_law_1.01,0.06437119841575623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,2,4,power_law_1.01,0.06465280055999756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,2,4,power_law_1.01,0.0830847978591919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,2,4,power_law_1.01,0.09863680005073547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,2,4,power_law_1.01,0.10929919481277466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,2,4,power_law_1.01,0.13304959535598754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,2,4,power_law_1.01,0.19039360284805298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,2,4,power_law_1.01,0.25754880905151367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,2,4,power_law_1.01,0.343174409866333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,2,4,power_law_1.01,0.423033618927002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,2,4,power_law_1.01,0.6376448154449463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,2,4,power_law_1.01,0.8203647613525391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,2,4,power_law_1.01,1.2129599571228027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,2,4,power_law_1.01,1.8771263122558595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,2,4,power_law_1.01,2.764531135559082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,2,4,power_law_1.01,3.9572799682617186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,2,4,power_law_1.01,4.743289566040039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,2,4,power_law_1.01,6.333292770385742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,2,4,power_law_1.01,15.747219848632813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,2,4,power_law_1.2,0.035148799419403076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,2,4,power_law_1.2,0.03426559865474701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,2,4,power_law_1.2,0.031065601110458373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,2,4,power_law_1.2,0.02573440074920654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,2,4,power_law_1.2,0.032287999987602234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,2,4,power_law_1.2,0.04826239943504333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,2,4,power_law_1.2,0.040057599544525146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,2,4,power_law_1.2,0.050310397148132326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,2,4,power_law_1.2,0.042854401469230655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,2,4,power_law_1.2,0.046623998880386354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,2,4,power_law_1.2,0.055225598812103274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,2,4,power_law_1.2,0.07529600262641907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,2,4,power_law_1.2,0.06906239986419678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,2,4,power_law_1.2,0.08302720189094544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,2,4,power_law_1.2,0.10040960311889649
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,2,4,power_law_1.2,0.11134079694747925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,2,4,power_law_1.2,0.14574719667434693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,2,4,power_law_1.2,0.18957439661026002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,2,4,power_law_1.2,0.24405760765075685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,2,4,power_law_1.2,0.36980481147766114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,2,4,power_law_1.2,0.47404160499572756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,2,4,power_law_1.2,0.6206783771514892
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,2,4,power_law_1.2,1.0601728439331055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,2,4,power_law_1.2,1.520364761352539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,2,4,power_law_1.2,1.8804031372070313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,2,4,power_law_1.2,2.8120384216308594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,2,4,power_law_1.2,4.265510559082031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,2,4,power_law_1.2,4.868844985961914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,2,4,power_law_1.2,8.167052459716796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,2,4,power_law_1.2,20.29877166748047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,2,4,power_law_1.01,0.06504319906234741
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,2,4,power_law_1.01,0.06915839910507202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,2,4,power_law_1.01,0.06750720143318176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,2,4,power_law_1.01,0.07037439942359924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,2,4,power_law_1.01,0.0713919997215271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,2,4,power_law_1.01,0.0728384017944336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,2,4,power_law_1.01,0.07244160175323486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,2,4,power_law_1.01,0.07342720031738281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,2,4,power_law_1.01,0.0732479989528656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,2,4,power_law_1.01,0.07468159794807434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,2,4,power_law_1.01,0.0744704008102417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,2,4,power_law_1.01,0.07857919931411743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,2,4,power_law_1.01,0.08840320110321045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,2,4,power_law_1.01,0.09208959937095643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,2,4,power_law_1.01,0.10150400400161744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,2,4,power_law_1.01,0.10826239585876465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,2,4,power_law_1.01,0.11910400390625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,2,4,power_law_1.01,0.13735040426254272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,2,4,power_law_1.01,0.1580415964126587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,2,4,power_law_1.01,0.19775999784469606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,2,4,power_law_1.01,0.2514240026473999
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,2,4,power_law_1.01,0.2936320066452026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,2,4,power_law_1.01,0.4347072124481201
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,4,2,power_law_1.01,0.05497599840164184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,2,4,power_law_1.01,0.6622591972351074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,4,2,power_law_1.01,0.05866879820823669
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,2,4,power_law_1.01,0.7089471817016602
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,4,2,power_law_1.01,0.0578495979309082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,4,2,power_law_1.01,0.06317440271377564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,2,4,power_law_1.01,1.1924736022949218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,4,2,power_law_1.01,0.06643840074539184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,2,4,power_law_1.01,1.7218816757202149
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,4,2,power_law_1.01,0.07033600211143494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,2,4,power_law_1.01,1.8619583129882813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,4,2,power_law_1.01,0.07669119834899903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,2,4,power_law_1.01,2.97259521484375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,4,2,power_law_1.01,0.08242560029029847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,4,2,power_law_1.01,0.09265919923782348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,2,4,power_law_1.01,8.50772476196289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,4,2,power_law_1.01,0.10290559530258178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,4,2,power_law_1.01,0.10986239910125732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,4,2,power_law_1.01,0.143449604511261
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,4,2,power_law_1.01,0.16679680347442627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,4,2,power_law_1.01,0.22619519233703614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,4,2,power_law_1.01,0.27267839908599856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,4,2,power_law_1.01,0.3488703966140747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,2,4,power_law_1.2,0.07058560252189636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,4,2,power_law_1.01,0.4932544231414795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,2,4,power_law_1.2,0.06136959791183472
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,2,4,power_law_1.2,0.0654591977596283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,4,2,power_law_1.01,0.6716351985931397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,2,4,power_law_1.2,0.070387202501297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,4,2,power_law_1.01,0.8387328147888183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,2,4,power_law_1.2,0.07181439995765686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,4,2,power_law_1.01,1.025107192993164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,2,4,power_law_1.2,0.07284479737281799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,4,2,power_law_1.01,1.4899776458740235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,2,4,power_law_1.2,0.07242239713668823
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,4,2,power_law_1.01,3.406099319458008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,2,4,power_law_1.2,0.07386239767074584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,2,4,power_law_1.2,0.07365760207176208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,2,4,power_law_1.2,0.07550079822540283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,2,4,power_law_1.2,0.07570559978485107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,2,4,power_law_1.2,0.08267520070075988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,2,4,power_law_1.2,0.08920959830284118
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,4,2,power_law_1.01,0.022623999416828154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,1,8,power_law_1.01,0.07994880080223084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,4,2,power_law_1.01,0.022623999416828154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,1,8,power_law_1.01,0.08097919821739197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,4,2,power_law_1.01,0.02221439927816391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,1,8,power_law_1.01,0.0815936028957367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,1,8,power_law_1.2,0.08390399813652039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,4,2,power_law_1.01,0.022195200622081756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,1,8,power_law_1.01,0.08282880187034607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,1,8,power_law_1.2,0.08390399813652039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,4,2,power_law_1.01,0.02508159875869751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,1,8,power_law_1.01,0.08384640216827392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,1,8,power_law_1.2,0.08841599822044373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,4,2,power_law_1.01,0.03204480111598969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,1,8,power_law_1.2,0.0933247983455658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,4,2,power_law_1.01,0.031219199299812317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,1,8,power_law_1.2,0.10028159618377686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,4,2,power_law_1.01,0.032864001393318173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,1,8,power_law_1.2,0.11073919534683227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,4,2,power_law_1.01,0.03223040103912354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,1,8,power_law_1.2,0.1193343997001648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,4,2,power_law_1.01,0.03306879997253418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,1,8,power_law_1.2,0.14943360090255736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,4,2,power_law_1.01,0.03531520068645477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,1,8,power_law_1.2,0.2059648036956787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,4,2,power_law_1.01,0.04596480131149292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,1,8,power_law_1.2,0.18835840225219727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,4,2,power_law_1.01,0.04679040014743805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,1,8,power_law_1.2,0.24956800937652587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,4,2,power_law_1.01,0.050470399856567386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,1,8,power_law_1.2,0.30836479663848876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,4,2,power_law_1.01,0.0633791983127594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,4,2,power_law_1.01,0.063155198097229
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,1,8,power_law_1.2,0.45274882316589354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,4,2,power_law_1.01,0.07996799945831298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,1,8,power_law_1.2,0.5772672176361084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,4,2,power_law_1.01,0.10617599487304688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,1,8,power_law_1.2,0.8420607566833496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,4,2,power_law_1.01,0.12625279426574706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,1,8,power_law_1.2,1.116710376739502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,4,2,power_law_1.01,0.18421119451522827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,1,8,power_law_1.2,1.6923711776733399
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,4,2,power_law_1.01,0.23129599094390868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,1,8,power_law_1.2,2.349401664733887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,4,2,power_law_1.01,0.33350400924682616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,1,8,power_law_1.2,2.937785530090332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,4,2,power_law_1.01,0.4404032230377197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,1,8,power_law_1.2,4.426278305053711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,4,2,power_law_1.01,0.6498496055603027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,4,2,power_law_1.01,0.8539072036743164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,1,8,power_law_1.2,10.673075103759766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,4,2,power_law_1.01,1.2690239906311036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,4,2,power_law_1.01,1.6952064514160157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,4,2,power_law_1.01,2.1068544387817383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,4,2,power_law_1.01,3.321343994140625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,4,2,power_law_1.01,6.655072021484375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,4,2,power_law_1.2,0.021644799411296843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,4,2,power_law_1.2,0.021644799411296843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,4,2,power_law_1.2,0.02102400064468384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,4,2,power_law_1.2,0.0212351992726326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,4,2,power_law_1.2,0.024505600333213806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,4,2,power_law_1.2,0.03147520124912262
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,4,2,power_law_1.2,0.031065601110458373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,4,2,power_law_1.01,0.053337597846984865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,4,2,power_law_1.2,0.032915198802948
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,4,2,power_law_1.01,0.05375360250473023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,4,2,power_law_1.2,0.03187839984893799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,4,2,power_law_1.01,0.0537663996219635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,4,2,power_law_1.2,0.03475199937820435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,4,2,power_law_1.01,0.07134720087051391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,4,2,power_law_1.2,0.03475199937820435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,4,2,power_law_1.01,0.0718720018863678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,4,2,power_law_1.2,0.04519039988517761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,4,2,power_law_1.01,0.07340800166130065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,4,2,power_law_1.01,0.07013760209083557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,4,2,power_law_1.2,0.04642559885978699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,4,2,power_law_1.01,0.07382400035858154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,4,2,power_law_1.2,0.050310397148132326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,4,2,power_law_1.01,0.07464320063591004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,4,2,power_law_1.2,0.06220160126686096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,4,2,power_law_1.01,0.07546240091323853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,4,2,power_law_1.2,0.06282240152359009
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,4,2,power_law_1.01,0.07709439992904663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,4,2,power_law_1.2,0.07775999903678894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,4,2,power_law_1.01,0.08138239979743958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,4,2,power_law_1.2,0.10645760297775268
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,4,2,power_law_1.01,0.08364800214767457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,4,2,power_law_1.2,0.13140480518341063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,4,2,power_law_1.01,0.08775039911270141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,4,2,power_law_1.2,0.18158719539642335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,4,2,power_law_1.01,0.09307519793510437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,4,2,power_law_1.2,0.2292992115020752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,4,2,power_law_1.01,0.10023679733276367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,4,2,power_law_1.2,0.3376512050628662
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,4,2,power_law_1.01,0.10248960256576538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,4,2,power_law_1.2,0.4388288021087646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,4,2,power_law_1.01,0.12645119428634644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,4,2,power_law_1.2,0.6483200073242188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,4,2,power_law_1.01,0.14281599521636962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,4,2,power_law_1.2,0.863372802734375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,4,2,power_law_1.01,0.18216960430145263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,4,2,power_law_1.2,1.2760319709777832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,4,2,power_law_1.01,0.21042559146881104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,4,2,power_law_1.2,1.6948223114013672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,4,2,power_law_1.01,0.2812864065170288
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,4,2,power_law_1.2,2.1169471740722656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,4,2,power_law_1.01,0.3339200019836426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,4,2,power_law_1.01,0.5219264030456543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,4,2,power_law_1.2,3.3657470703125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,4,2,power_law_1.01,0.6413119792938232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,4,2,power_law_1.2,6.663718414306641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,4,2,power_law_1.01,0.8571136474609375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,4,2,power_law_1.01,1.2821375846862793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,4,2,power_law_1.01,1.689900779724121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,4,2,power_law_1.01,2.2106176376342774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,4,2,power_law_1.01,4.962118530273438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,4,2,power_law_1.2,0.05236480236053467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,4,2,power_law_1.2,0.0515392005443573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,4,2,power_law_1.2,0.054816001653671266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,4,2,power_law_1.2,0.0699072003364563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,4,2,power_law_1.2,0.070387202501297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,4,2,power_law_1.2,0.0720255970954895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,8,1,power_law_1.01,0.020979200303554536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,4,2,power_law_1.2,0.07141759991645813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,8,1,power_law_1.01,0.021388800442218782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,4,2,power_law_1.2,0.07285119891166687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,8,1,power_law_1.01,0.021388800442218782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,4,2,power_law_1.2,0.07386879920959473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,8,1,power_law_1.01,0.02139520049095154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,8,1,power_law_1.01,0.025484800338745117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,4,2,power_law_1.2,0.07653120160102844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,8,1,power_law_1.01,0.0328575998544693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,4,2,power_law_1.2,0.07775359749794006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,8,1,power_law_1.01,0.03532159924507141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,4,2,power_law_1.2,0.08021759986877441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,8,1,power_law_1.01,0.03449600040912628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,4,2,power_law_1.2,0.08021759986877441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,8,1,power_law_1.01,0.037574398517608645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,4,2,power_law_1.2,0.08635519742965699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,8,1,power_law_1.01,0.038387200236320494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,4,2,power_law_1.2,0.09166719913482665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,8,1,power_law_1.01,0.03859840035438537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,4,2,power_law_1.2,0.09559680223464966
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,8,1,power_law_1.01,0.04678399860858917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,4,2,power_law_1.2,0.1011072039604187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,8,1,power_law_1.01,0.047193598747253415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,4,2,power_law_1.2,0.1297727942466736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,8,1,power_law_1.01,0.049446401000022885
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,4,2,power_law_1.2,0.14985599517822265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,8,1,power_law_1.01,0.06276479959487916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,4,2,power_law_1.2,0.18774399757385254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,8,1,power_law_1.01,0.06480640172958374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,4,2,power_law_1.2,0.20718080997467042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,8,1,power_law_1.01,0.07935360074043274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,4,2,power_law_1.2,0.27948799133300783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,8,1,power_law_1.01,0.10617599487304688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,4,2,power_law_1.2,0.3906879901885986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,8,1,power_law_1.01,0.12583680152893068
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,4,2,power_law_1.2,0.4547904014587402
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,8,1,power_law_1.01,0.18316800594329835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,4,2,power_law_1.2,0.6059264183044434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,8,1,power_law_1.01,0.2298815965652466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,4,2,power_law_1.2,0.8273216247558594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,8,1,power_law_1.01,0.3353280067443848
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,4,2,power_law_1.2,1.3362175941467285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,8,1,power_law_1.01,0.4326335906982422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,4,2,power_law_1.2,1.409164810180664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,8,1,power_law_1.01,0.6409088134765625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,4,2,power_law_1.2,2.4933696746826173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,8,1,power_law_1.01,0.844480037689209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,8,1,power_law_1.01,1.2632960319519042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,4,2,power_law_1.2,5.818265533447265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,8,1,power_law_1.01,1.6726783752441405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,8,1,power_law_1.01,2.0718271255493166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,8,1,power_law_1.01,3.298323059082031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,8,1,power_law_1.01,6.597286224365234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,8,1,power_law_1.2,0.021638399362564086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,8,1,power_law_1.2,0.02328319996595383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,8,1,power_law_1.2,0.027379199862480164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,8,1,power_law_1.2,0.042534399032592776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,8,1,power_law_1.2,0.043558400869369504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,8,1,power_law_1.2,0.04928640127182007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,8,1,power_law_1.01,0.04760960042476654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,8,1,power_law_1.2,0.04909439980983734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,8,1,power_law_1.01,0.04945279955863953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,8,1,power_law_1.2,0.04293760061264038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,8,1,power_law_1.01,0.049856001138687135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,8,1,power_law_1.2,0.051545602083206174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,8,1,power_law_1.01,0.07117440104484558
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,8,1,power_law_1.2,0.05441280007362366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,8,1,power_law_1.01,0.07136639952659607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,8,1,power_law_1.2,0.0531711995601654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,8,1,power_law_1.01,0.07216640114784241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,8,1,power_law_1.2,0.05538560152053833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,8,1,power_law_1.01,0.07177600264549255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,8,1,power_law_1.2,0.061375999450683595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,8,1,power_law_1.01,0.0732096016407013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,8,1,power_law_1.2,0.06505600214004517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,8,1,power_law_1.01,0.07341439723968506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,8,1,power_law_1.2,0.06915839910507202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,8,1,power_law_1.01,0.07586560249328614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,8,1,power_law_1.2,0.07263360023498536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,8,1,power_law_1.01,0.07956479787826538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,8,1,power_law_1.2,0.08697599768638611
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,8,1,power_law_1.01,0.08018559813499451
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,8,1,power_law_1.01,0.0840511977672577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,8,1,power_law_1.2,0.11256959438323974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,8,1,power_law_1.01,0.08568959832191467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,8,1,power_law_1.2,0.13715200424194335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,8,1,power_law_1.01,0.09716479778289795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,8,1,power_law_1.2,0.18753279447555543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,8,1,power_law_1.01,0.09921280145645142
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,8,1,power_law_1.2,0.23749120235443116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,8,1,power_law_1.01,0.11437439918518066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,8,1,power_law_1.2,0.3403007984161377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,8,1,power_law_1.01,0.12625279426574706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,8,1,power_law_1.2,0.4482304096221924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,8,1,power_law_1.01,0.14079359769821168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,8,1,power_law_1.2,0.6491456031799316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,8,1,power_law_1.01,0.17007999420166015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,8,1,power_law_1.2,0.8568127632141114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,8,1,power_law_1.01,0.19957120418548585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,8,1,power_law_1.2,1.268876838684082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,8,1,power_law_1.01,0.25973761081695557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,8,1,power_law_1.2,1.6715072631835937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,8,1,power_law_1.01,0.31626238822937014
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,8,1,power_law_1.2,2.084992027282715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,8,1,power_law_1.01,0.4330431938171387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,8,1,power_law_1.2,3.322604751586914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,8,1,power_law_1.01,0.5493504047393799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,8,1,power_law_1.01,0.7834496021270752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,8,1,power_law_1.2,6.56579818725586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,8,1,power_law_1.01,1.0177472114562989
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,8,1,power_law_1.01,1.2624832153320313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,2,4,power_law_1.2,0.09617279767990113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,8,1,power_law_1.01,2.0120319366455077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,2,4,power_law_1.2,0.1064255952835083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,2,4,power_law_1.2,0.11482880115509034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,8,1,power_law_1.01,4.169599914550782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,2,4,power_law_1.2,0.11542400121688842
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,2,4,power_law_1.2,0.14737919569015503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,8,1,power_law_1.2,0.043961599469184875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,2,4,power_law_1.2,0.16868480443954467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,8,1,power_law_1.2,0.04785920083522797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,2,4,power_law_1.2,0.20944640636444092
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,8,1,power_law_1.2,0.047443199157714847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,1,8,power_law_1.01,0.08630399703979492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,2,4,power_law_1.2,0.2944256067276001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,8,1,power_law_1.2,0.06955519914627076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,1,8,power_law_1.01,0.09326720237731934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,2,4,power_law_1.2,0.35423998832702636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,8,1,power_law_1.2,0.07038080096244811
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,1,8,power_law_1.01,0.09755520224571228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,2,4,power_law_1.2,0.4437376022338867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,8,1,power_law_1.2,0.07264000177383423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,1,8,power_law_1.01,0.10697599649429321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,2,4,power_law_1.2,0.6544576168060303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,8,1,power_law_1.2,0.07407360076904297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,1,8,power_law_1.01,0.11722240447998047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,2,4,power_law_1.2,0.7822527885437012
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,8,1,power_law_1.2,0.07242879867553711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,1,8,power_law_1.01,0.13074560165405275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,2,4,power_law_1.2,1.3513919830322265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,8,1,power_law_1.2,0.07304319739341736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,1,8,power_law_1.01,0.16269439458847046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,2,4,power_law_1.2,1.7091903686523438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,8,1,power_law_1.2,0.07222399711608887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,1,8,power_law_1.01,0.052716797590255736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,1,8,power_law_1.01,0.18520959615707397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,8,1,power_law_1.2,0.07571200132369996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,2,4,power_law_1.2,2.1374271392822264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,1,8,power_law_1.01,0.08610560297966004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,1,8,power_law_1.01,0.25892479419708253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,8,1,power_law_1.2,0.0830784022808075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,2,4,power_law_1.2,3.4082111358642577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,1,8,power_law_1.01,0.32858240604400635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,1,8,power_law_1.01,0.05682560205459595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,8,1,power_law_1.2,0.0834879994392395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,1,8,power_law_1.01,0.434662389755249
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,1,8,power_law_1.01,0.06788480281829834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,8,1,power_law_1.2,0.0859391987323761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,2,4,power_law_1.2,8.764749145507812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,1,8,power_law_1.01,0.5800511837005615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,8,1,power_law_1.2,0.09536640048027038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,1,8,power_law_1.01,0.09326080083847046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,1,8,power_law_1.01,0.8735360145568848
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,8,1,power_law_1.2,0.09822720289230347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,1,8,power_law_1.01,0.09818879961967468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,1,8,power_law_1.01,1.1137920379638673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,8,1,power_law_1.2,0.10786559581756591
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,1,8,power_law_1.01,0.11580159664154052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,8,1,power_law_1.2,0.1268928050994873
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,1,8,power_law_1.01,1.573964786529541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,8,1,power_law_1.2,0.13941119909286498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,1,8,power_law_1.01,0.11230720281600952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,1,8,power_law_1.01,2.177510452270508
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,8,1,power_law_1.2,0.16888320446014404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,1,8,power_law_1.01,0.12665599584579468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,1,8,power_law_1.01,2.9717248916625976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,8,1,power_law_1.2,0.1969599962234497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,1,8,power_law_1.01,0.13790080547332764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,1,8,power_law_1.01,4.849139022827148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,1,8,power_law_1.2,0.029420799016952513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,8,1,power_law_1.2,0.25919361114501954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,8,1,power_law_1.2,0.3108288049697876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,1,8,power_law_1.01,0.15368319749832154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,1,8,power_law_1.2,0.0310591995716095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,1,8,power_law_1.01,10.405158233642577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,8,1,power_law_1.2,0.43061118125915526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,1,8,power_law_1.01,0.17929600477218627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,1,8,power_law_1.2,0.037196800112724304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,8,1,power_law_1.2,0.5448959827423095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,1,8,power_law_1.01,0.18175359964370727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,1,8,power_law_1.2,0.03720960021018982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,8,1,power_law_1.2,0.7802303791046142
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,1,8,power_law_1.01,0.22311680316925048
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,8,1,power_law_1.2,1.0161472320556642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,1,8,power_law_1.2,0.05316479802131653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,8,1,power_law_1.2,1.2629119873046875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,1,8,power_law_1.2,0.06198400259017944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,1,8,power_law_1.01,0.18480639457702636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,8,1,power_law_1.2,2.0198848724365233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,1,8,power_law_1.01,0.1940287947654724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,1,8,power_law_1.01,0.09940479993820191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,8,1,power_law_1.2,4.202419281005859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,1,8,power_law_1.01,0.14057600498199463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,1,8,power_law_1.01,0.2435839891433716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,1,8,power_law_1.01,0.2155456066131592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,1,8,power_law_1.01,0.10227839946746826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,1,8,power_law_1.01,0.2554624080657959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,1,8,power_law_1.01,0.09488639831542969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,1,8,power_law_1.01,0.3631999969482422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,1,8,power_law_1.01,0.12009600400924683
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,1,8,power_law_1.01,0.4188992023468018
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,1,8,power_law_1.01,0.13258880376815796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,1,8,power_law_1.2,0.09701120257377624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,1,8,power_law_1.01,0.6017983913421631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,1,8,power_law_1.01,0.16678400039672853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,1,8,power_law_1.2,0.1383679986000061
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,1,8,power_law_1.01,0.7379903793334961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,1,8,power_law_1.01,0.17252479791641234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,1,8,power_law_1.2,0.0841152012348175
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,1,8,power_law_1.01,1.0900351524353027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,1,8,power_law_1.01,0.17416319847106934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,1,8,power_law_1.2,0.0957759976387024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,1,8,power_law_1.01,0.18153599500656128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,1,8,power_law_1.01,1.3202367782592774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,1,8,power_law_1.2,0.110316801071167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,1,8,power_law_1.01,0.17887359857559204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,1,8,power_law_1.2,0.12363519668579101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,1,8,power_law_1.01,2.1205631256103517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,1,8,power_law_1.01,0.18235520124435425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,1,8,power_law_1.2,0.1600767970085144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,1,8,power_law_1.01,2.636057662963867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,1,8,power_law_1.01,0.18788479566574096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,1,8,power_law_1.2,0.1686784029006958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,1,8,power_law_1.01,3.66192626953125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,1,8,power_law_1.01,0.19137279987335204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,1,8,power_law_1.2,0.17196160554885864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,1,8,power_law_1.01,5.5517822265625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,1,8,power_law_1.2,0.16889599561691285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,1,8,power_law_1.01,0.20570240020751954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,1,8,power_law_1.2,0.17505279779434205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,1,8,power_law_1.01,0.2089792013168335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,1,8,power_law_1.01,11.607520294189452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,1,8,power_law_1.2,0.18957439661026002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,1,8,power_law_1.01,0.21511681079864503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,1,8,power_law_1.2,0.18547199964523314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,1,8,power_law_1.01,0.2325376033782959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,1,8,power_law_1.2,0.19572479724884034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,1,8,power_law_1.01,0.25854079723358153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,1,8,power_law_1.2,0.19900159835815429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,1,8,power_law_1.01,0.29908480644226076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,1,8,power_law_1.2,0.21804800033569335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,1,8,power_law_1.01,0.315065598487854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,1,8,power_law_1.2,0.22438399791717528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,1,8,power_law_1.01,0.39185919761657717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,1,8,power_law_1.2,0.24732160568237305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,2,4,power_law_1.01,0.03203839957714081
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,1,8,power_law_1.01,0.4506368160247803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,1,8,power_law_1.2,0.26331520080566406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,2,4,power_law_1.01,0.0584447979927063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,1,8,power_law_1.01,0.5751488208770752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,1,8,power_law_1.2,0.31571838855743406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,2,4,power_law_1.01,0.056415998935699464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,1,8,power_law_1.01,0.7162816047668457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,1,8,power_law_1.2,0.3415424108505249
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,2,4,power_law_1.01,0.06767359972000123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,1,8,power_law_1.01,0.9673407554626465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,1,8,power_law_1.2,0.40380158424377444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,2,4,power_law_1.01,0.09185919761657715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,1,8,power_law_1.01,1.3062848091125487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,2,4,power_law_1.01,0.09225599765777588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,1,8,power_law_1.2,0.48019838333129883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,1,8,power_law_1.01,1.497760009765625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,2,4,power_law_1.01,0.11557120084762573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,1,8,power_law_1.2,0.6753664016723633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,2,4,power_law_1.01,0.12215679883956909
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,1,8,power_law_1.2,0.8023296356201172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,1,8,power_law_1.01,2.4521535873413085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,2,4,power_law_1.01,0.12051199674606324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,1,8,power_law_1.2,1.1306367874145509
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,1,8,power_law_1.01,4.6744384765625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,2,4,power_law_1.01,0.12461440563201905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,1,8,power_law_1.2,1.338700771331787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,2,4,power_law_1.01,0.1344383955001831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,1,8,power_law_1.2,1.8935039520263672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,2,4,power_law_1.01,0.14222079515457153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,1,8,power_law_1.2,2.5644224166870115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,2,4,power_law_1.01,0.16147840023040771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,2,4,power_law_1.01,0.1844159960746765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,1,8,power_law_1.2,6.47509765625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,2,4,power_law_1.01,0.15815680027008056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,2,4,power_law_1.01,0.17568639516830445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,2,4,power_law_1.2,0.032441601157188416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,2,4,power_law_1.01,0.1942463994026184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,2,4,power_law_1.2,0.055795198678970336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,2,4,power_law_1.01,0.194649600982666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,2,4,power_law_1.2,0.043699198961257936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,2,4,power_law_1.01,0.22148480415344238
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,2,4,power_law_1.2,0.06726400256156921
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,2,4,power_law_1.01,0.29171841144561766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,2,4,power_law_1.01,0.08369280099868774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,2,4,power_law_1.2,0.08895999789237977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,2,4,power_law_1.01,0.376313591003418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,2,4,power_law_1.01,0.11030399799346924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,2,4,power_law_1.01,0.47031679153442385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,2,4,power_law_1.2,0.0850816011428833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,2,4,power_law_1.01,0.0865664005279541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,2,4,power_law_1.2,0.11886080503463745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,2,4,power_law_1.01,0.5960512161254883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,2,4,power_law_1.01,0.09659519791603088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,2,4,power_law_1.2,0.12460160255432129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,2,4,power_law_1.01,0.13059200048446656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,2,4,power_law_1.01,0.846720027923584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,2,4,power_law_1.01,0.1572160005569458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,2,4,power_law_1.2,0.1217344045639038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,2,4,power_law_1.01,1.131392002105713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,2,4,power_law_1.01,0.18978559970855713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,2,4,power_law_1.2,0.12993279695510865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,2,4,power_law_1.01,1.678009605407715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,2,4,power_law_1.01,0.20023679733276367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,2,4,power_law_1.2,0.14342399835586547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,2,4,power_law_1.01,2.098464012145996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,2,4,power_law_1.01,0.19285759925842286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,2,4,power_law_1.2,0.1565567970275879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,2,4,power_law_1.01,2.5754367828369142
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,2,4,power_law_1.01,0.2041088104248047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,2,4,power_law_1.2,0.17087359428405763
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,2,4,power_law_1.01,4.087270355224609
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,2,4,power_law_1.01,0.21210880279541017
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,2,4,power_law_1.2,0.19997440576553344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,2,4,power_law_1.01,0.21415040493011475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,2,4,power_law_1.2,0.16883200407028198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,2,4,power_law_1.01,7.986867523193359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,2,4,power_law_1.01,0.21907200813293456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,2,4,power_law_1.2,0.18418560028076172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,2,4,power_law_1.01,0.22191998958587647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,2,4,power_law_1.2,0.216377592086792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,2,4,power_law_1.01,0.2309567928314209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,2,4,power_law_1.2,0.20304639339447023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,2,4,power_law_1.01,0.24158720970153807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,2,4,power_law_1.2,0.23867518901824952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,2,4,power_law_1.01,0.26146559715270995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,2,4,power_law_1.2,0.31300480365753175
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,2,4,power_law_1.2,0.0834496021270752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,2,4,power_law_1.01,0.27640318870544434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,2,4,power_law_1.2,0.38835840225219725
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,2,4,power_law_1.2,0.11313920021057129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,2,4,power_law_1.01,0.3132607936859131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,2,4,power_law_1.2,0.5206783771514892
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,2,4,power_law_1.2,0.07953919768333435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,2,4,power_law_1.01,0.36837120056152345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,2,4,power_law_1.2,0.674892807006836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,2,4,power_law_1.2,0.10002559423446655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,2,4,power_law_1.01,0.3755264043807983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,2,4,power_law_1.2,0.9792384147644043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,2,4,power_law_1.2,0.11683199405670167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,2,4,power_law_1.01,0.4556096076965332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,2,4,power_law_1.2,1.2063551902770997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,2,4,power_law_1.2,0.13341439962387086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,2,4,power_law_1.01,0.5547455787658692
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,2,4,power_law_1.2,1.7333120346069335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,2,4,power_law_1.2,0.1819584012031555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,2,4,power_law_1.01,0.6900991916656494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,2,4,power_law_1.2,2.2704896926879883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,2,4,power_law_1.2,0.18906240463256835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,2,4,power_law_1.01,0.8334591865539551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,2,4,power_law_1.2,2.8312320709228516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,2,4,power_law_1.2,0.19791359901428224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,2,4,power_law_1.01,1.1535743713378905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,2,4,power_law_1.2,4.446675109863281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,2,4,power_law_1.2,0.20325760841369628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,2,4,power_law_1.01,1.4920960426330567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,2,4,power_law_1.2,0.21267199516296387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,2,4,power_law_1.01,1.7874303817749024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,2,4,power_law_1.2,9.755513763427734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,2,4,power_law_1.2,0.2163520097732544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,2,4,power_law_1.01,2.8665088653564452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,2,4,power_law_1.2,0.21532158851623534
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,2,4,power_law_1.2,0.2302720069885254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,2,4,power_law_1.01,5.283967971801758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,2,4,power_law_1.2,0.23348479270935057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,2,4,power_law_1.2,0.2485055923461914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,4,2,power_law_1.01,0.022809599339962006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,2,4,power_law_1.2,0.26856958866119385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,4,2,power_law_1.01,0.026700800657272337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,2,4,power_law_1.2,0.3005183935165405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,4,2,power_law_1.01,0.029151999950408937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,2,4,power_law_1.2,0.31630079746246337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,4,2,power_law_1.2,0.02245119959115982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,4,2,power_law_1.01,0.0500544011592865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,2,4,power_law_1.2,0.37385599613189696
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,4,2,power_law_1.2,0.022463999688625336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,4,2,power_law_1.01,0.07052800059318542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,4,2,power_law_1.2,0.024102400243282317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,2,4,power_law_1.2,0.39638400077819824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,4,2,power_law_1.01,0.08834559917449951
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,4,2,power_law_1.2,0.0286080002784729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,2,4,power_law_1.2,0.47849597930908205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,4,2,power_law_1.2,0.042534399032592776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,2,4,power_law_1.2,0.5542784214019776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,4,2,power_law_1.2,0.05175679922103882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,2,4,power_law_1.2,0.6953855991363526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,4,2,power_law_1.2,0.06220160126686096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,2,4,power_law_1.2,0.902131175994873
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,4,2,power_law_1.2,0.07120640277862549
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,2,4,power_law_1.2,1.237484836578369
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,4,2,power_law_1.2,0.08083199858665466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,2,4,power_law_1.2,1.5727168083190919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,4,2,power_law_1.2,0.08920320272445678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,2,4,power_law_1.2,1.9669759750366211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,4,2,power_law_1.2,0.10497920513153076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,4,2,power_law_1.2,0.10826239585876465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,2,4,power_law_1.2,2.935628890991211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,4,2,power_law_1.2,0.12095359563827515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,4,2,power_law_1.2,0.14678399562835692
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,2,4,power_law_1.2,5.988639831542969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,4,2,power_law_1.2,0.11871999502182007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,4,2,power_law_1.2,0.13256959915161132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,4,2,power_law_1.2,0.1615231990814209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,4,2,power_law_1.2,0.1509951949119568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,4,2,power_law_1.2,0.18345600366592407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,4,2,power_law_1.2,0.24501121044158936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,4,2,power_law_1.2,0.32065279483795167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,4,2,power_law_1.01,0.08201599717140198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,4,2,power_law_1.2,0.4482367992401123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,4,2,power_law_1.01,0.0998207986354828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,4,2,power_law_1.2,0.5866879940032959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,4,2,power_law_1.01,0.09840000271797181
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,4,2,power_law_1.01,0.11437439918518066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,4,2,power_law_1.2,0.8653951644897461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,1,8,power_law_1.2,0.06627200245857238
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,4,2,power_law_1.01,0.14755200147628783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,4,2,power_law_1.2,1.1011391639709474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,4,2,power_law_1.01,0.19158400297164918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,1,8,power_law_1.2,0.08000640273094177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,4,2,power_law_1.2,1.7190271377563477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,4,2,power_law_1.01,0.23192958831787108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,1,8,power_law_1.2,0.09331200122833253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,4,2,power_law_1.2,2.2455680847167967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,4,2,power_law_1.01,0.24462080001831055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,1,8,power_law_1.2,0.10562560558319092
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,4,2,power_law_1.2,2.8689727783203125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,4,2,power_law_1.01,0.25077118873596194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,1,8,power_law_1.2,0.13181439638137818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,4,2,power_law_1.2,4.425043106079102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,4,2,power_law_1.01,0.2577343940734863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,1,8,power_law_1.2,0.15905280113220216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,4,2,power_law_1.01,0.2757567882537842
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,1,8,power_law_1.2,0.1852671980857849
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,4,2,power_law_1.2,8.699635314941407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,4,2,power_law_1.01,0.27433600425720217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,1,8,power_law_1.2,0.2352447986602783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,4,2,power_law_1.01,0.2773823976516724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,1,8,power_law_1.2,0.1678655982017517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,4,2,power_law_1.01,0.2841536045074463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,1,8,power_law_1.2,0.19530880451202393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,4,2,power_law_1.01,0.3054527997970581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,1,8,power_law_1.2,0.2518336057662964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,4,2,power_law_1.01,0.2988991975784302
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,1,8,power_law_1.2,0.20636160373687745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,1,8,power_law_1.2,0.2628864049911499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,4,2,power_law_1.01,0.34209280014038085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,4,2,power_law_1.2,0.08103039860725403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,1,8,power_law_1.2,0.38536319732666013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,4,2,power_law_1.01,0.37119359970092775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,4,2,power_law_1.2,0.09168639779090881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,4,2,power_law_1.01,0.4121535778045654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,1,8,power_law_1.2,0.49943041801452637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,4,2,power_law_1.2,0.08839679956436157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,4,2,power_law_1.01,0.46456317901611327
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,1,8,power_law_1.2,0.7404736042022705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,4,2,power_law_1.2,0.11626240015029907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,4,2,power_law_1.01,0.5055871963500976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,1,8,power_law_1.2,0.9788736343383789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,4,2,power_law_1.2,0.13284480571746826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,4,2,power_law_1.01,0.6226560115814209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,1,8,power_law_1.2,1.4603327751159667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,4,2,power_law_1.2,0.1678655982017517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,4,2,power_law_1.01,0.7097152233123779
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,1,8,power_law_1.2,1.9440895080566407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,4,2,power_law_1.2,0.22992000579833985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,4,2,power_law_1.01,0.9337663650512695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,1,8,power_law_1.2,2.9017343521118164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,4,2,power_law_1.2,0.24343039989471435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,4,2,power_law_1.01,1.1105152130126954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,4,2,power_law_1.2,0.24569599628448485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,1,8,power_law_1.2,3.858143997192383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,4,2,power_law_1.01,1.5825663566589356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,4,2,power_law_1.2,0.2612607955932617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,1,8,power_law_1.2,4.8043262481689455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,4,2,power_law_1.2,0.2637120008468628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,4,2,power_law_1.01,2.000569534301758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,1,8,power_law_1.2,7.679494476318359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,4,2,power_law_1.2,0.28092160224914553
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,4,2,power_law_1.01,2.4152191162109373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,4,2,power_law_1.2,0.285427188873291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,4,2,power_law_1.01,3.7073665618896485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,1,8,power_law_1.2,15.345805358886718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,4,2,power_law_1.2,0.28888959884643556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,4,2,power_law_1.2,0.3145087957382202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,4,2,power_law_1.01,7.12713623046875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,4,2,power_law_1.2,0.3190144062042236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,4,2,power_law_1.2,0.34685440063476564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,8,1,power_law_1.01,0.021427200734615327
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,4,2,power_law_1.2,0.3761600017547607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,8,1,power_law_1.01,0.02223999947309494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,8,1,power_law_1.2,0.022419199347496033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,4,2,power_law_1.2,0.42568321228027345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,8,1,power_law_1.01,0.02327679991722107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,8,1,power_law_1.2,0.024646399915218352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,4,2,power_law_1.2,0.4855231761932373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,8,1,power_law_1.2,0.02773120105266571
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,4,2,power_law_1.2,0.509280014038086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,8,1,power_law_1.2,0.0385919988155365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,4,2,power_law_1.2,0.6288832187652588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,8,1,power_law_1.2,0.06991360187530518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,4,2,power_law_1.2,0.7159167766571045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,8,1,power_law_1.2,0.08446080088615418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,4,2,power_law_1.2,0.962502384185791
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,8,1,power_law_1.2,0.1051584005355835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,4,2,power_law_1.2,1.2375424385070801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,8,1,power_law_1.2,0.11763199567794799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,4,2,power_law_1.2,1.6833919525146483
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,8,1,power_law_1.2,0.12666239738464355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,4,2,power_law_1.2,2.122265625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,8,1,power_law_1.2,0.13054720163345337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,4,2,power_law_1.2,2.4755584716796877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,8,1,power_law_1.2,0.1475391983985901
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,8,1,power_law_1.2,0.1606592059135437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,4,2,power_law_1.2,4.050060653686524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,8,1,power_law_1.2,0.17089920043945311
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,8,1,power_law_1.2,0.1934272050857544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,4,2,power_law_1.2,8.272601318359374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,8,1,power_law_1.2,0.1754047989845276
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,8,1,power_law_1.2,0.18830080032348634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,8,1,power_law_1.2,0.21225600242614745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,8,1,power_law_1.2,0.21921920776367188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,8,1,power_law_1.2,0.2546560049057007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,8,1,power_law_1.2,0.29786880016326905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,8,1,power_law_1.2,0.3449215888977051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,8,1,power_law_1.2,0.42955517768859863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,8,1,power_law_1.2,0.5305088043212891
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,8,1,power_law_1.01,0.09208959937095643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,8,1,power_law_1.2,0.7142271995544434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,8,1,power_law_1.01,0.10069760084152221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,8,1,power_law_1.2,0.9059264183044433
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,8,1,power_law_1.01,0.11789439916610718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,8,1,power_law_1.2,1.2919551849365234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,8,1,power_law_1.01,0.15864959955215455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,8,1,power_law_1.2,1.6640832901000977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,8,1,power_law_1.01,0.2006335973739624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,8,1,power_law_1.2,2.04849910736084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,8,1,power_law_1.01,0.2454848051071167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,8,1,power_law_1.01,0.3288511991500854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,8,1,power_law_1.2,3.1832319259643556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,8,1,power_law_1.01,0.350547194480896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,8,1,power_law_1.2,6.228051376342774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,8,1,power_law_1.01,0.358732795715332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,8,1,power_law_1.01,0.37185280323028563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,8,1,power_law_1.01,0.38496639728546145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,8,1,power_law_1.01,0.4016831874847412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,8,1,power_law_1.01,0.3970367908477783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,8,1,power_law_1.01,0.4103551864624023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,8,1,power_law_1.01,0.42570881843566893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,8,1,power_law_1.01,0.44537601470947263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,8,1,power_law_1.01,0.4756800174713135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,8,1,power_law_1.01,0.5428607940673829
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,8,1,power_law_1.01,0.5887360095977783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,8,1,power_law_1.2,0.09634559750556945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,8,1,power_law_1.01,0.6983104228973389
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,8,1,power_law_1.2,0.10432640314102173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,8,1,power_law_1.01,0.7535999774932861
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,8,1,power_law_1.2,0.11560319662094116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,8,1,power_law_1.01,0.943667221069336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,8,1,power_law_1.2,0.15166079998016357
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,8,1,power_law_1.2,0.18339200019836427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,8,1,power_law_1.01,1.0863936424255372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,8,1,power_law_1.2,0.22721920013427735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,8,1,power_law_1.01,1.4255423545837402
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,8,1,power_law_1.2,0.3296191930770874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,8,1,power_law_1.01,1.7640064239501954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,8,1,power_law_1.2,0.3445631980895996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,8,1,power_law_1.01,2.427212715148926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,8,1,power_law_1.2,0.35992319583892823
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,8,1,power_law_1.01,3.1163711547851562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,8,1,power_law_1.2,0.36894080638885496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,8,1,power_law_1.01,3.8106494903564454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,8,1,power_law_1.2,0.39166719913482667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,4,2,power_law_1.01,0.11149439811706544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,8,1,power_law_1.2,0.40476160049438475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,8,1,power_law_1.01,5.81214714050293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,4,2,power_law_1.01,0.11825920343399048
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,8,1,power_law_1.2,0.4211711883544922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,4,2,power_law_1.01,0.12828799486160278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,8,1,power_law_1.2,0.45802879333496094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,8,1,power_law_1.01,11.417670440673827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,8,1,power_law_1.2,0.44858880043029786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,4,2,power_law_1.01,0.13177599906921386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,8,1,power_law_1.2,0.4871103763580322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,4,2,power_law_1.01,0.1450816035270691
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,8,1,power_law_1.2,0.49692158699035643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,4,2,power_law_1.01,0.1446720004081726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,8,1,power_law_1.2,0.5661632061004639
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,4,2,power_law_1.01,0.15448960065841674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,1,8,power_law_1.01,0.02778240144252777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,8,1,power_law_1.2,0.609990406036377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,4,2,power_law_1.01,0.17498879432678222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,1,8,power_law_1.01,0.023897600173950196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,8,1,power_law_1.2,0.71463041305542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,4,2,power_law_1.01,0.1538879990577698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,1,8,power_law_1.01,0.026144000887870788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,4,2,power_law_1.01,0.16637439727783204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,8,1,power_law_1.2,0.7727935791015625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,1,8,power_law_1.01,0.0310591995716095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,4,2,power_law_1.01,0.19218560457229614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,8,1,power_law_1.2,0.9521920204162597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,1,8,power_law_1.01,0.039238399267196654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,4,2,power_law_1.01,0.18889600038528442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,8,1,power_law_1.2,1.0932991981506348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,1,8,power_law_1.01,0.04950399994850159
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,1,8,power_law_1.01,0.05441280007362366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,4,2,power_law_1.01,0.2184000015258789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,8,1,power_law_1.2,1.4430335998535155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,1,8,power_law_1.01,0.05112959742546082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,4,2,power_law_1.01,0.28474879264831543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,8,1,power_law_1.2,1.7668928146362304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,1,8,power_law_1.01,0.05605120062828064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,4,2,power_law_1.01,0.3470016002655029
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,8,1,power_law_1.2,2.446828842163086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,1,8,power_law_1.01,0.06033920049667359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,4,2,power_law_1.01,0.44940800666809083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,1,8,power_law_1.01,0.070387202501297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,8,1,power_law_1.2,3.109676742553711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,4,2,power_law_1.01,0.5530303955078125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,1,8,power_law_1.01,0.05788800120353699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,8,1,power_law_1.2,3.786220932006836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,1,8,power_law_1.01,0.06219519972801209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,4,2,power_law_1.01,0.7781119823455811
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,1,8,power_law_1.01,0.07182080149650574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,8,1,power_law_1.2,5.8604286193847654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,4,2,power_law_1.01,0.9509696006774903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,1,8,power_law_1.01,0.061375999450683595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,4,2,power_law_1.01,1.493280029296875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,1,8,power_law_1.01,0.06587520241737366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,8,1,power_law_1.2,11.555532836914063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,1,8,power_law_1.01,0.07939199805259704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,4,2,power_law_1.01,1.7955520629882813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,1,8,power_law_1.01,0.1047808051109314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,4,2,power_law_1.01,2.2684352874755858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,1,8,power_law_1.01,0.12117760181427002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,1,8,power_law_1.01,0.15333759784698486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,4,2,power_law_1.01,3.606131362915039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,1,8,power_law_1.01,0.1946943998336792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,1,8,power_law_1.2,0.027929601073265076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,1,8,power_law_1.01,0.28970239162445066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,4,2,power_law_1.01,7.223385620117187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,1,8,power_law_1.2,0.023027199506759643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,1,8,power_law_1.01,0.3595583915710449
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,1,8,power_law_1.2,0.027539199590682982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,1,8,power_law_1.01,0.5739776134490967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,1,8,power_law_1.2,0.03081600069999695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,1,8,power_law_1.01,0.6958271980285644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,1,8,power_law_1.2,0.03694719970226288
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,1,8,power_law_1.01,0.05619199872016907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,1,8,power_law_1.01,1.0892607688903808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,1,8,power_law_1.2,0.050886398553848265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,1,8,power_law_1.01,0.04595839977264404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,1,8,power_law_1.2,0.056415998935699464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,1,8,power_law_1.01,1.531007957458496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,1,8,power_law_1.01,0.047193598747253415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,1,8,power_law_1.2,0.05374720096588135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,1,8,power_law_1.01,1.9100992202758789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,1,8,power_law_1.01,0.05475199818611145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,1,8,power_law_1.2,0.055795198678970336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,1,8,power_law_1.01,3.235763168334961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,1,8,power_law_1.01,0.060703998804092406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,1,8,power_law_1.2,0.05907840132713318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,1,8,power_law_1.01,0.07155839800834655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,1,8,power_law_1.2,0.06909440159797668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,1,8,power_law_1.01,5.521542358398437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,1,8,power_law_1.01,0.07544320225715637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,1,8,power_law_1.2,0.060102397203445436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,1,8,power_law_1.01,0.0742143988609314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,1,8,power_law_1.2,0.06398720145225525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,1,8,power_law_1.2,0.07218559980392455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,1,8,power_law_1.01,0.07504000067710877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,1,8,power_law_1.2,0.06686080098152161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,1,8,power_law_1.01,0.07505279779434204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,1,8,power_law_1.2,0.06607999801635742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,1,8,power_law_1.2,0.06993920207023621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,1,8,power_law_1.01,0.07585279941558838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,1,8,power_law_1.2,0.043756800889968875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,1,8,power_law_1.2,0.08078719973564148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,1,8,power_law_1.01,0.07831040024757385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,1,8,power_law_1.2,0.04683519899845123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,1,8,power_law_1.2,0.11250560283660889
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,1,8,power_law_1.01,0.07791360020637512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,1,8,power_law_1.2,0.05113599896430969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,1,8,power_law_1.2,0.13116159439086914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,1,8,power_law_1.01,0.07995520234107971
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,1,8,power_law_1.2,0.055232000350952146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,1,8,power_law_1.2,0.18440959453582764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,1,8,power_law_1.01,0.08958079814910888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,1,8,power_law_1.2,0.0716159999370575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,1,8,power_law_1.2,0.22024960517883302
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,1,8,power_law_1.01,0.09223679900169372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,1,8,power_law_1.2,0.07325440049171447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,1,8,power_law_1.2,0.3054464101791382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,1,8,power_law_1.01,0.09612799882888794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,1,8,power_law_1.2,0.07489280104637146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,1,8,power_law_1.2,0.4240128040313721
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,1,8,power_law_1.01,0.11026560068130493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,1,8,power_law_1.2,0.07491199970245362
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,1,8,power_law_1.2,0.6347583770751953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,1,8,power_law_1.2,0.07694079875946044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,1,8,power_law_1.01,0.11189759969711303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,1,8,power_law_1.2,0.07816960215568543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,1,8,power_law_1.2,0.8911744117736816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,1,8,power_law_1.01,0.13565440177917482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,1,8,power_law_1.2,0.07858560085296631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,1,8,power_law_1.01,0.15982719659805297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,1,8,power_law_1.2,1.2264384269714355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,1,8,power_law_1.2,0.07982720136642456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,1,8,power_law_1.01,0.1878592014312744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,1,8,power_law_1.2,1.7288127899169923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,1,8,power_law_1.2,0.08287360072135926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,1,8,power_law_1.01,0.24809598922729492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,1,8,power_law_1.2,2.1488447189331055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,1,8,power_law_1.2,0.0933184027671814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,1,8,power_law_1.01,0.30974080562591555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,1,8,power_law_1.2,3.4712383270263674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,1,8,power_law_1.2,0.095769602060318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,1,8,power_law_1.01,0.3830399990081787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,8,1,power_law_1.01,0.02839039862155914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,1,8,power_law_1.2,0.10437120199203491
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,1,8,power_law_1.01,0.5002048015594482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,1,8,power_law_1.2,6.946482849121094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,8,1,power_law_1.01,0.04969600141048432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,1,8,power_law_1.2,0.11585919857025147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,1,8,power_law_1.01,0.7006656169891358
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,8,1,power_law_1.01,0.05973759889602661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,1,8,power_law_1.2,0.12035200595855713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,1,8,power_law_1.01,0.9059007644653321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,1,8,power_law_1.2,0.1455423951148987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,8,1,power_law_1.01,0.06669440269470214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,1,8,power_law_1.2,0.17299840450286866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,8,1,power_law_1.01,0.07303680181503296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,1,8,power_law_1.01,1.4602944374084472
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,2,4,power_law_1.01,0.023443199694156647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,1,8,power_law_1.2,0.21415040493011475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,8,1,power_law_1.01,0.08021119832992554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,2,4,power_law_1.01,0.023852799832820893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,1,8,power_law_1.01,2.668000030517578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,1,8,power_law_1.2,0.29173119068145753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,8,1,power_law_1.01,0.08592000007629394
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,2,4,power_law_1.01,0.029555198550224305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,1,8,power_law_1.2,0.35054080486297606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,2,4,power_law_1.01,0.03592320084571839
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,8,1,power_law_1.01,0.09864320158958435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,1,8,power_law_1.2,0.4916543960571289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,2,4,power_law_1.01,0.04472320079803467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,8,1,power_law_1.01,0.110316801071167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,2,4,power_law_1.01,0.06296319961547851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,1,8,power_law_1.2,0.6487360000610352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,8,1,power_law_1.01,0.12199679613113404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,2,4,power_law_1.2,0.023020799458026885
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,2,4,power_law_1.01,0.05375360250473023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,1,8,power_law_1.2,0.9063743591308594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,8,1,power_law_1.01,0.1449280023574829
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,2,4,power_law_1.2,0.022393600642681123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,2,4,power_law_1.01,0.05538560152053833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,1,8,power_law_1.2,0.9903360366821289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,8,1,power_law_1.01,0.11973760128021241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,2,4,power_law_1.2,0.02956799864768982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,2,4,power_law_1.01,0.05989760160446167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,2,4,power_law_1.2,0.035308799147605895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,8,1,power_law_1.01,0.1338688015937805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,2,4,power_law_1.01,0.065830397605896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,1,8,power_law_1.2,1.8845056533813476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,2,4,power_law_1.2,0.040633600950241086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,2,4,power_law_1.01,0.06234239935874939
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,8,1,power_law_1.01,0.16069120168685913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,1,8,power_law_1.2,4.3216064453125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,2,4,power_law_1.2,0.061337602138519284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,2,4,power_law_1.01,0.06520959734916687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,8,1,power_law_1.01,0.15763200521469117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,2,4,power_law_1.2,0.051686400175094606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,2,4,power_law_1.01,0.07054719924926758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,8,1,power_law_1.01,0.1899839997291565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,2,4,power_law_1.2,0.05800960063934326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,2,4,power_law_1.01,0.06604160070419311
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,8,1,power_law_1.01,0.20760319232940674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,2,4,power_law_1.01,0.0736191987991333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,2,4,power_law_1.2,0.060703998804092406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,8,1,power_law_1.01,0.2563071966171265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,2,4,power_law_1.01,0.048665601015090945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,2,4,power_law_1.01,0.07968639731407165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,2,4,power_law_1.2,0.06664320230484008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,8,1,power_law_1.01,0.3472512006759644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,2,4,power_law_1.01,0.048691201210021975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,2,4,power_law_1.01,0.07217919826507568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,2,4,power_law_1.2,0.061926400661468504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,8,1,power_law_1.01,0.4375807762145996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,2,4,power_law_1.01,0.049081599712371825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,2,4,power_law_1.01,0.09101439714431762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,2,4,power_law_1.2,0.06664320230484008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,2,4,power_law_1.01,0.05727999806404114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,8,1,power_law_1.01,0.6333568096160889
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,2,4,power_law_1.01,0.10167039632797241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,2,4,power_law_1.2,0.07278720140457154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,2,4,power_law_1.01,0.0646399974822998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,2,4,power_law_1.01,0.13626879453659058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,8,1,power_law_1.01,0.8207615852355957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,2,4,power_law_1.2,0.06930559873580933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,2,4,power_law_1.01,0.08186240196228027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,2,4,power_law_1.01,0.16720000505447388
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,2,4,power_law_1.2,0.07420799732208253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,8,1,power_law_1.01,1.1928959846496583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,2,4,power_law_1.01,0.08799999952316284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,2,4,power_law_1.01,0.22967679500579835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,2,4,power_law_1.2,0.08363519906997681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,8,1,power_law_1.01,1.584665584564209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,2,4,power_law_1.01,0.08391039967536926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,2,4,power_law_1.01,0.3025727987289429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,2,4,power_law_1.2,0.07216640114784241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,2,4,power_law_1.01,0.09106559753417968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,8,1,power_law_1.01,1.9637567520141601
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,2,4,power_law_1.01,0.40025601387023924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,2,4,power_law_1.2,0.09264640212059021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,2,4,power_law_1.01,0.09065600037574768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,2,4,power_law_1.01,0.5403456211090087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,2,4,power_law_1.2,0.10698239803314209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,8,1,power_law_1.01,3.109401512145996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,2,4,power_law_1.01,0.08984320163726807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,2,4,power_law_1.01,0.8387519836425781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,2,4,power_law_1.2,0.1407807946205139
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,2,4,power_law_1.01,0.09189760088920593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,2,4,power_law_1.2,0.17148799896240235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,8,1,power_law_1.01,6.148646545410156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,2,4,power_law_1.01,1.1117312431335449
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,2,4,power_law_1.01,0.09169279932975768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,2,4,power_law_1.2,0.24789121150970458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,2,4,power_law_1.01,1.30383358001709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,2,4,power_law_1.01,0.09575679898262024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,2,4,power_law_1.2,0.30071680545806884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,2,4,power_law_1.01,2.339116859436035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,2,4,power_law_1.01,0.10436480045318604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,2,4,power_law_1.2,0.4449024200439453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,2,4,power_law_1.01,0.10724480152130127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,2,4,power_law_1.2,0.05583360195159912
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,2,4,power_law_1.2,0.5948095798492432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,2,4,power_law_1.01,4.364166259765625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,2,4,power_law_1.01,0.11257599592208863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,2,4,power_law_1.2,0.04394879937171936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,2,4,power_law_1.2,0.9521856307983398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,2,4,power_law_1.01,0.13182079792022705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,2,4,power_law_1.2,0.05092480182647705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,2,4,power_law_1.2,1.1576000213623048
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,2,4,power_law_1.01,0.13898240327835082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,2,4,power_law_1.2,0.05604479908943176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,2,4,power_law_1.01,0.16908799409866332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,2,4,power_law_1.2,1.436953639984131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,4,2,power_law_1.01,0.0201664000749588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,2,4,power_law_1.2,0.06096640229225159
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,2,4,power_law_1.01,0.18303359746932985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,4,2,power_law_1.01,0.01995519995689392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,2,4,power_law_1.2,0.08510720133781433
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,2,4,power_law_1.2,2.525676727294922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,2,4,power_law_1.01,0.23423359394073487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,4,2,power_law_1.01,0.024051199853420257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,2,4,power_law_1.2,0.08632959723472595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,2,4,power_law_1.2,4.4034881591796875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,4,2,power_law_1.01,0.02754560112953186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,2,4,power_law_1.01,0.2655616044998169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,2,4,power_law_1.2,0.0914687991142273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,4,2,power_law_1.01,0.03531520068645477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,2,4,power_law_1.01,0.37306239604949953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,2,4,power_law_1.2,0.09125760197639465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,4,2,power_law_1.01,0.04760960042476654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,2,4,power_law_1.01,0.4875391960144043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,2,4,power_law_1.2,0.09345279932022095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,4,2,power_law_1.01,0.051046401262283325
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,2,4,power_law_1.2,0.09106559753417968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,2,4,power_law_1.01,0.6556928157806396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,4,2,power_law_1.2,0.01953279972076416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,4,2,power_law_1.01,0.05539199709892273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,2,4,power_law_1.2,0.09003520011901855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,2,4,power_law_1.01,0.8773056030273437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,4,2,power_law_1.2,0.019731199741363524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,4,2,power_law_1.01,0.0574400007724762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,2,4,power_law_1.2,0.09352319836616516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,2,4,power_law_1.01,1.0095935821533204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,4,2,power_law_1.2,0.02240640074014664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,4,2,power_law_1.01,0.06108800172805786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,2,4,power_law_1.2,0.09701120257377624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,2,4,power_law_1.01,1.6493951797485351
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,4,2,power_law_1.01,0.06849920153617858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,4,2,power_law_1.2,0.027526399493217467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,2,4,power_law_1.2,0.10274560451507568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,4,2,power_law_1.01,0.06173440217971802
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,4,2,power_law_1.2,0.03386879861354828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,2,4,power_law_1.2,0.11789439916610718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,2,4,power_law_1.01,3.046329689025879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,4,2,power_law_1.01,0.06563199758529663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,4,2,power_law_1.2,0.04862079918384552
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,2,4,power_law_1.2,0.1133952021598816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,4,2,power_law_1.01,0.07463039755821228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,4,2,power_law_1.2,0.05086719989776611
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,2,4,power_law_1.2,0.13141119480133057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,4,2,power_law_1.01,0.06972799897193908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,4,2,power_law_1.2,0.05333120226860046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,2,4,power_law_1.2,0.13755520582199096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,4,2,power_law_1.01,0.07832959890365601
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,4,2,power_law_1.2,0.05804160237312317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,2,4,power_law_1.2,0.17114239931106567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,4,2,power_law_1.01,0.08730880022048951
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,4,2,power_law_1.2,0.06398079991340637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,2,4,power_law_1.2,0.19244799613952637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,4,2,power_law_1.01,0.05175679922103882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,4,2,power_law_1.01,0.09081599712371827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,4,2,power_law_1.2,0.06970239877700805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,2,4,power_law_1.2,0.2493824005126953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,4,2,power_law_1.01,0.05070719718933105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,4,2,power_law_1.01,0.10494719743728638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,4,2,power_law_1.2,0.06316800117492676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,2,4,power_law_1.2,0.3026240110397339
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,4,2,power_law_1.01,0.055225598812103274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,4,2,power_law_1.01,0.1381119966506958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,4,2,power_law_1.2,0.06849279999732971
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,2,4,power_law_1.2,0.42017278671264646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,4,2,power_law_1.01,0.0634112000465393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,4,2,power_law_1.01,0.15943039655685426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,4,2,power_law_1.2,0.07647359967231751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,4,2,power_law_1.01,0.0736191987991333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,2,4,power_law_1.2,0.5133567810058594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,4,2,power_law_1.01,0.22004480361938478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,4,2,power_law_1.2,0.07196800112724304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,4,2,power_law_1.01,0.1043776035308838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,2,4,power_law_1.2,0.8093055725097656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,4,2,power_law_1.01,0.2661184072494507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,4,2,power_law_1.2,0.07769600152969361
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,4,2,power_law_1.01,0.10641280412673951
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,2,4,power_law_1.2,1.0026240348815918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,4,2,power_law_1.01,0.40169601440429686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,4,2,power_law_1.2,0.08650879859924317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,4,2,power_law_1.01,0.11133439540863037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,2,4,power_law_1.2,1.2547327995300293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,4,2,power_law_1.01,0.49694080352783204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,4,2,power_law_1.2,0.09100800156593322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,4,2,power_law_1.01,0.10969599485397338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,4,2,power_law_1.01,0.7445375919342041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,4,2,power_law_1.01,0.11584639549255371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,2,4,power_law_1.2,2.0075775146484376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,4,2,power_law_1.2,0.10330239534378052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,4,2,power_law_1.01,0.1164736032485962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,4,2,power_law_1.2,0.1368831992149353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,4,2,power_law_1.01,0.9026368141174317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,2,4,power_law_1.2,3.8876415252685548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,4,2,power_law_1.01,0.11687040328979492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,4,2,power_law_1.2,0.15901440382003784
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,4,2,power_law_1.01,1.1903743743896484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,4,2,power_law_1.01,0.12485760450363159
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,4,2,power_law_1.2,0.2106175899505615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,4,2,power_law_1.01,1.8434816360473634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,4,2,power_law_1.01,0.12710399627685548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,4,2,power_law_1.2,0.2826751947402954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,4,2,power_law_1.01,0.13712639808654786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,4,2,power_law_1.01,3.6844287872314454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,4,2,power_law_1.2,0.36625919342041013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,4,2,power_law_1.01,0.13756799697875977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,4,2,power_law_1.2,0.47358078956604005
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,4,2,power_law_1.2,0.053990399837493895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,4,2,power_law_1.01,0.15189119577407836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,4,2,power_law_1.2,0.7396031856536865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,4,2,power_law_1.2,0.04990079998970032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,4,2,power_law_1.01,0.17627520561218263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,4,2,power_law_1.2,0.9788288116455078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,4,2,power_law_1.2,0.054201602935791016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,4,2,power_law_1.01,0.18405120372772216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,4,2,power_law_1.2,0.06320000290870667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,4,2,power_law_1.2,1.2870400428771973
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,4,2,power_law_1.01,0.22480640411376954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,4,2,power_law_1.2,0.07345280051231384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,4,2,power_law_1.01,0.2604351997375488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,4,2,power_law_1.2,1.951411247253418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,4,2,power_law_1.2,0.10212479829788208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,4,2,power_law_1.01,0.32493441104888915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,4,2,power_law_1.2,0.10887680053710938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,4,2,power_law_1.2,3.743814468383789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,4,2,power_law_1.01,0.4074560165405273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,1,8,power_law_1.01,0.05518720149993896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,4,2,power_law_1.2,0.11420799493789673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,4,2,power_law_1.01,0.5608640193939209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,1,8,power_law_1.01,0.07545599937438965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,4,2,power_law_1.2,0.11093120574951172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,1,8,power_law_1.01,0.04883840084075928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,4,2,power_law_1.01,0.7195903778076171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,4,2,power_law_1.2,0.11604479551315308
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,1,8,power_law_1.01,0.05866879820823669
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,4,2,power_law_1.01,0.9907327651977539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,4,2,power_law_1.2,0.1211583971977234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,1,8,power_law_1.01,0.077920001745224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,4,2,power_law_1.01,1.2522687911987305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,4,2,power_law_1.2,0.12260479927062988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,1,8,power_law_1.01,0.0902079999446869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,4,2,power_law_1.01,1.5760640144348144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,4,2,power_law_1.2,0.12607359886169434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,1,8,power_law_1.01,0.09797120094299316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,4,2,power_law_1.01,2.5496896743774413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,4,2,power_law_1.2,0.12773120403289795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,1,8,power_law_1.01,0.10718719959259033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,1,8,power_law_1.2,0.05537279844284058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,4,2,power_law_1.2,0.1375488042831421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,1,8,power_law_1.01,0.11497600078582763
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,4,2,power_law_1.01,4.701113510131836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,1,8,power_law_1.2,0.04287999868392944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,1,8,power_law_1.01,0.12891520261764527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,4,2,power_law_1.2,0.14574719667434693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,1,8,power_law_1.2,0.049644801020622256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,1,8,power_law_1.01,0.14837119579315186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,4,2,power_law_1.2,0.15537279844284058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,1,8,power_law_1.2,0.05537279844284058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,1,8,power_law_1.01,0.1725376009941101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,4,2,power_law_1.2,0.1725823998451233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,1,8,power_law_1.2,0.06746240258216858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,1,8,power_law_1.01,0.13730560541152953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,4,2,power_law_1.2,0.19017599821090697
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,1,8,power_law_1.2,0.09122560024261475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,1,8,power_law_1.01,0.15841280221939086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,4,2,power_law_1.2,0.22725119590759277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,1,8,power_law_1.01,0.10028159618377686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,1,8,power_law_1.01,0.18154879808425903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,1,8,power_law_1.2,0.0934719979763031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,4,2,power_law_1.2,0.2510080099105835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,1,8,power_law_1.01,0.11461119651794434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,1,8,power_law_1.01,0.14550399780273438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,1,8,power_law_1.2,0.1102720022201538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,4,2,power_law_1.2,0.34112000465393066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,1,8,power_law_1.01,0.0830847978591919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,1,8,power_law_1.01,0.167193603515625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,1,8,power_law_1.2,0.11967999935150146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,4,2,power_law_1.2,0.422214412689209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,1,8,power_law_1.01,0.09886080026626587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,1,8,power_law_1.01,0.22780799865722656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,1,8,power_law_1.2,0.12870399951934813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,4,2,power_law_1.2,0.6018239974975585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,1,8,power_law_1.01,0.1043776035308838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,1,8,power_law_1.01,0.2896768093109131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,1,8,power_law_1.2,0.14547840356826783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,4,2,power_law_1.2,0.7289984226226807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,1,8,power_law_1.01,0.13182079792022705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,1,8,power_law_1.01,0.39022719860076904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,1,8,power_law_1.2,0.17560319900512694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,1,8,power_law_1.01,0.13960959911346435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,4,2,power_law_1.2,1.0108287811279297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,1,8,power_law_1.01,0.49610238075256347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,1,8,power_law_1.2,0.13524479866027833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,1,8,power_law_1.01,0.14185600280761718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,4,2,power_law_1.2,1.4493056297302247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,1,8,power_law_1.01,0.70316162109375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,1,8,power_law_1.2,0.16227840185165404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,1,8,power_law_1.01,0.1430848002433777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,4,2,power_law_1.2,1.6872831344604493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,1,8,power_law_1.01,0.9399040222167969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,1,8,power_law_1.01,0.14041600227355958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,1,8,power_law_1.2,0.18522239923477174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,4,2,power_law_1.2,2.456307220458984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,1,8,power_law_1.01,1.3574912071228027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,1,8,power_law_1.01,0.1547711968421936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,1,8,power_law_1.2,0.14916479587554932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,1,8,power_law_1.2,0.17292799949645996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,1,8,power_law_1.01,0.1502527952194214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,1,8,power_law_1.01,1.785318374633789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,4,2,power_law_1.2,6.223571014404297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,1,8,power_law_1.2,0.23785600662231446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,1,8,power_law_1.01,0.1541440010070801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,1,8,power_law_1.01,2.6413888931274414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,1,8,power_law_1.01,0.1557760000228882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,1,8,power_law_1.2,0.2958143949508667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,1,8,power_law_1.01,3.4290496826171877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,1,8,power_law_1.01,0.16457600593566896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,1,8,power_law_1.2,0.39288959503173826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,1,8,power_law_1.01,4.414745712280274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,1,8,power_law_1.01,0.17196799516677858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,1,8,power_law_1.2,0.52641282081604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,1,8,power_law_1.01,0.18302079439163207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,1,8,power_law_1.2,0.7682752132415771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,1,8,power_law_1.01,7.102130889892578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,1,8,power_law_1.2,0.10027519464492798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,1,8,power_law_1.01,0.2059648036956787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,1,8,power_law_1.2,0.94399995803833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,1,8,power_law_1.2,0.0890175998210907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,1,8,power_law_1.01,14.298605346679688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,1,8,power_law_1.01,0.2301248073577881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,1,8,power_law_1.2,0.0804095983505249
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,1,8,power_law_1.2,1.5035264015197753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,1,8,power_law_1.01,0.26657280921936033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,1,8,power_law_1.2,0.09639040231704712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,1,8,power_law_1.2,1.9395263671875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,1,8,power_law_1.01,0.29852159023284913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,1,8,power_law_1.2,0.1012992024421692
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,1,8,power_law_1.2,2.8791488647460937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,1,8,power_law_1.01,0.36959359645843504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,1,8,power_law_1.2,0.13425920009613038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,1,8,power_law_1.2,4.038118362426758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,2,4,power_law_1.01,0.03736959993839264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,1,8,power_law_1.2,0.14491519927978516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,1,8,power_law_1.01,0.451910400390625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,1,8,power_law_1.2,4.546636962890625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,2,4,power_law_1.01,0.04020479917526245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,1,8,power_law_1.2,0.14083199501037597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,1,8,power_law_1.01,0.5809408187866211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,2,4,power_law_1.01,0.0430976003408432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,1,8,power_law_1.2,0.14636160135269166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,1,8,power_law_1.01,0.7052544116973877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,1,8,power_law_1.2,7.976217651367188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,2,4,power_law_1.01,0.05047680139541626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,1,8,power_law_1.2,0.14574079513549804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,1,8,power_law_1.01,0.9305407524108886
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,2,4,power_law_1.01,0.06501759886741638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,1,8,power_law_1.2,0.1502527952194214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,1,8,power_law_1.01,1.2605183601379395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,1,8,power_law_1.2,15.561593627929687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,2,4,power_law_1.01,0.0955136001110077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,1,8,power_law_1.2,0.15229439735412598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,1,8,power_law_1.01,1.5072511672973632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,2,4,power_law_1.01,0.09959679841995239
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,1,8,power_law_1.2,0.15393279790878295
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,2,4,power_law_1.01,0.1016767978668213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,1,8,power_law_1.01,2.2574464797973635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,1,8,power_law_1.2,0.15960960388183593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,2,4,power_law_1.01,0.10495359897613525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,1,8,power_law_1.2,0.1674496054649353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,2,4,power_law_1.2,0.03612160086631775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,1,8,power_law_1.01,4.89997444152832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,2,4,power_law_1.01,0.11191040277481079
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,1,8,power_law_1.2,0.18360960483551025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,2,4,power_law_1.2,0.027923199534416198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,2,4,power_law_1.01,0.1301375985145569
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,1,8,power_law_1.2,0.1955072045326233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,2,4,power_law_1.2,0.038387200236320494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,2,4,power_law_1.01,0.14177919626235963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,1,8,power_law_1.2,0.21946239471435547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,2,4,power_law_1.2,0.05189759731292724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,2,4,power_law_1.01,0.12336640357971192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,1,8,power_law_1.2,0.22827520370483398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,2,4,power_law_1.2,0.059680002927780154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,2,4,power_law_1.01,0.13667839765548706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,1,8,power_law_1.2,0.2891135931015015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,2,4,power_law_1.2,0.08915839791297912
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,2,4,power_law_1.01,0.08472319841384887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,2,4,power_law_1.01,0.1510208010673523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,1,8,power_law_1.2,0.30138239860534666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,2,4,power_law_1.2,0.10084480047225952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,2,4,power_law_1.01,0.08944000005722046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,2,4,power_law_1.01,0.12725759744644166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,1,8,power_law_1.2,0.3708224058151245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,2,4,power_law_1.2,0.10040960311889649
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,2,4,power_law_1.01,0.07365760207176208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,2,4,power_law_1.01,0.1540992021560669
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,1,8,power_law_1.2,0.4752768039703369
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,2,4,power_law_1.2,0.10533759593963624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,2,4,power_law_1.01,0.08984959721565247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,2,4,power_law_1.01,0.19731839895248413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,1,8,power_law_1.2,0.6075776100158692
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,2,4,power_law_1.2,0.11352959871292115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,2,4,power_law_1.01,0.2292479991912842
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,2,4,power_law_1.01,0.10702719688415527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,1,8,power_law_1.2,0.7966015815734864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,2,4,power_law_1.2,0.13073279857635497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,2,4,power_law_1.01,0.14432640075683595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,2,4,power_law_1.01,0.2953984022140503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,1,8,power_law_1.2,1.2690624237060546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,2,4,power_law_1.2,0.1463039994239807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,2,4,power_law_1.01,0.1492416024208069
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,2,4,power_law_1.01,0.3642303943634033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,2,4,power_law_1.2,0.12091519832611083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,2,4,power_law_1.01,0.14984960556030275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,2,4,power_law_1.01,0.514137601852417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,1,8,power_law_1.2,1.5498496055603028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,2,4,power_law_1.2,0.13727999925613404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,2,4,power_law_1.01,0.15804799795150756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,2,4,power_law_1.01,0.6449984073638916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,1,8,power_law_1.2,1.8127935409545899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,2,4,power_law_1.2,0.15489920377731323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,2,4,power_law_1.01,0.1572224020957947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,2,4,power_law_1.01,0.9509696006774903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,1,8,power_law_1.2,2.979987144470215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,2,4,power_law_1.2,0.13360639810562133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,2,4,power_law_1.01,0.16254080533981324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,2,4,power_law_1.01,1.2292287826538086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,2,4,power_law_1.2,0.14915839433670045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,2,4,power_law_1.01,0.16807680130004882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,2,4,power_law_1.01,1.8864896774291993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,1,8,power_law_1.2,6.290361785888672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,2,4,power_law_1.2,0.20119040012359618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,2,4,power_law_1.01,0.16807680130004882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,2,4,power_law_1.01,2.435353660583496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,2,4,power_law_1.01,0.17768959999084472
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,2,4,power_law_1.2,0.24133760929107667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,2,4,power_law_1.01,2.898406410217285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,2,4,power_law_1.01,0.18485759496688842
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,2,4,power_law_1.2,0.3269439935684204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,2,4,power_law_1.01,0.19122560024261476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,2,4,power_law_1.2,0.3529599905014038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,2,4,power_law_1.01,4.7477375030517575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,2,4,power_law_1.01,0.19918080568313598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,2,4,power_law_1.2,0.5100287914276123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,2,4,power_law_1.2,0.08021119832992554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,2,4,power_law_1.01,9.905241394042969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,2,4,power_law_1.01,0.23011839389801025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,2,4,power_law_1.2,0.6912767887115479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,2,4,power_law_1.2,0.07036799788475037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,2,4,power_law_1.01,0.25715839862823486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,2,4,power_law_1.2,0.9763584136962891
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,2,4,power_law_1.2,0.0761023998260498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,2,4,power_law_1.01,0.3005631923675537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,2,4,power_law_1.2,1.3554431915283203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,2,4,power_law_1.2,0.0902400016784668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,2,4,power_law_1.01,0.31676158905029295
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,2,4,power_law_1.2,0.10273920297622681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,2,4,power_law_1.2,1.907583999633789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,2,4,power_law_1.01,0.39518721103668214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,2,4,power_law_1.2,0.14206720590591432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,4,2,power_law_1.01,0.026719999313354493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,2,4,power_law_1.2,2.598374366760254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,2,4,power_law_1.01,0.4728127956390381
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,2,4,power_law_1.2,0.15105279684066772
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,4,2,power_law_1.01,0.034297600388526917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,2,4,power_law_1.2,3.286092758178711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,2,4,power_law_1.2,0.1572160005569458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,2,4,power_law_1.01,0.6499775886535645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,4,2,power_law_1.01,0.04679040014743805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,2,4,power_law_1.2,5.231692886352539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,2,4,power_law_1.2,0.15639679431915282
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,4,2,power_law_1.01,0.06969599723815918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,2,4,power_law_1.01,0.769152021408081
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,2,4,power_law_1.2,0.16499840021133422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,4,2,power_law_1.01,0.09059839844703674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,2,4,power_law_1.01,1.1494720458984375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,2,4,power_law_1.2,10.413337707519531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,2,4,power_law_1.2,0.16581759452819825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,4,2,power_law_1.01,0.09081599712371827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,2,4,power_law_1.01,1.444377613067627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,2,4,power_law_1.2,0.16582399606704712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,4,2,power_law_1.01,0.09591680169105529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,2,4,power_law_1.01,1.5690943717956543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,2,4,power_law_1.2,0.1727679967880249
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,4,2,power_law_1.01,0.10781439542770385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,2,4,power_law_1.01,2.7878719329833985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,4,2,power_law_1.01,0.11292159557342529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,2,4,power_law_1.2,0.18178559541702272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,4,2,power_law_1.01,0.1213312029838562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,2,4,power_law_1.2,0.19285119771957399
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,4,2,power_law_1.2,0.026502400636672974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,2,4,power_law_1.01,5.408089447021484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,4,2,power_law_1.01,0.12400000095367432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,2,4,power_law_1.2,0.19816960096359254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,4,2,power_law_1.2,0.02917119860649109
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,4,2,power_law_1.01,0.13648639917373656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,2,4,power_law_1.2,0.2051392078399658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,4,2,power_law_1.2,0.04390400052070618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,4,2,power_law_1.01,0.1270591974258423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,2,4,power_law_1.2,0.2329792022705078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,4,2,power_law_1.2,0.0639743983745575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,4,2,power_law_1.01,0.12952959537506104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,2,4,power_law_1.2,0.25264639854431153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,4,2,power_law_1.2,0.08773760199546814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,4,2,power_law_1.01,0.14833279848098754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,2,4,power_law_1.2,0.30261759757995604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,4,2,power_law_1.2,0.08731520175933838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,4,2,power_law_1.01,0.14816000461578369
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,2,4,power_law_1.2,0.3310976028442383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,4,2,power_law_1.2,0.09674879908561707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,4,2,power_law_1.01,0.07365760207176208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,4,2,power_law_1.2,0.10533759593963624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,4,2,power_law_1.01,0.14466559886932373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,2,4,power_law_1.2,0.43430399894714355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,4,2,power_law_1.01,0.08635519742965699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,4,2,power_law_1.01,0.1761791944503784
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,2,4,power_law_1.2,0.48101119995117186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,4,2,power_law_1.01,0.08391039967536926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,4,2,power_law_1.01,0.20405120849609376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,2,4,power_law_1.2,0.6614208221435547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,4,2,power_law_1.01,0.11093759536743164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,4,2,power_law_1.01,0.25956480503082274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,2,4,power_law_1.2,0.8568191528320312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,4,2,power_law_1.01,0.13653759956359862
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,4,2,power_law_1.01,0.3048192024230957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,2,4,power_law_1.2,1.1846912384033204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,4,2,power_law_1.01,0.17053439617156982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,4,2,power_law_1.01,0.4211264133453369
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,2,4,power_law_1.2,1.440281581878662
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,4,2,power_law_1.01,0.17811199426651
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,4,2,power_law_1.01,0.5309375762939453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,2,4,power_law_1.2,1.9268863677978516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,4,2,power_law_1.01,0.19407360553741454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,4,2,power_law_1.01,0.745363187789917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,2,4,power_law_1.2,2.8767488479614256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,4,2,power_law_1.01,0.2012415885925293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,4,2,power_law_1.01,0.9796544075012207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,4,2,power_law_1.01,0.20248959064483643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,4,2,power_law_1.01,1.404595184326172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,2,4,power_law_1.2,6.451321411132812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,4,2,power_law_1.01,0.21210238933563233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,4,2,power_law_1.01,1.8746112823486327
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,4,2,power_law_1.01,0.21476480960845948
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,4,2,power_law_1.01,2.375545692443848
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,4,2,power_law_1.01,0.21701760292053224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,4,2,power_law_1.01,0.2227008104324341
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,4,2,power_law_1.01,3.7798721313476564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,4,2,power_law_1.01,0.2411776065826416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,4,2,power_law_1.01,7.265542602539062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,4,2,power_law_1.01,0.2473344087600708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,4,2,power_law_1.01,0.26330881118774413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,4,2,power_law_1.2,0.07487360239028931
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,4,2,power_law_1.01,0.30058879852294923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,4,2,power_law_1.2,0.07406079769134521
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,4,2,power_law_1.01,0.32330238819122314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,4,2,power_law_1.2,0.08409600257873535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,4,2,power_law_1.01,0.3677567958831787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,4,2,power_law_1.2,0.10191359519958496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,4,2,power_law_1.01,0.4238719940185547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,4,2,power_law_1.2,0.11605119705200195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,1,8,power_law_1.01,0.10126719474792481
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,4,2,power_law_1.01,0.545305585861206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,4,2,power_law_1.2,0.17768959999084472
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,1,8,power_law_1.01,0.14325120449066162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,4,2,power_law_1.2,0.18934400081634523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,4,2,power_law_1.01,0.6614399909973144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,1,8,power_law_1.01,0.20796799659729004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,4,2,power_law_1.2,0.19345279932022094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,4,2,power_law_1.01,0.8383808135986328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,4,2,power_law_1.2,0.20453119277954102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,1,8,power_law_1.01,0.09387519955635071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,4,2,power_law_1.01,1.0403136253356933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,4,2,power_law_1.2,0.20432000160217284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,1,8,power_law_1.01,0.1264575958251953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,4,2,power_law_1.01,1.431283187866211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,4,2,power_law_1.2,0.21373438835144043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,1,8,power_law_1.01,0.15205119848251342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,4,2,power_law_1.01,1.8234687805175782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,4,2,power_law_1.2,0.21866240501403808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,1,8,power_law_1.01,0.1641343951225281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,4,2,power_law_1.01,2.2599103927612303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,4,2,power_law_1.2,0.2235647916793823
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,1,8,power_law_1.01,0.20079998970031737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,4,2,power_law_1.2,0.22970240116119384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,4,2,power_law_1.01,3.4221248626708984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,4,2,power_law_1.2,0.2462912082672119
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,1,8,power_law_1.01,0.21923201084136962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,4,2,power_law_1.2,0.24466559886932374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,4,2,power_law_1.01,6.944499206542969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,1,8,power_law_1.01,0.22023680210113525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,4,2,power_law_1.2,0.271891188621521
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,1,8,power_law_1.01,0.22389121055603028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,4,2,power_law_1.2,0.3081536054611206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,1,8,power_law_1.01,0.23170559406280516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,4,2,power_law_1.2,0.32515840530395507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,4,2,power_law_1.2,0.3943615913391113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,1,8,power_law_1.01,0.22865281105041504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,4,2,power_law_1.2,0.439577579498291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,1,8,power_law_1.01,0.23929600715637206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,1,8,power_law_1.2,0.09864959716796876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,4,2,power_law_1.2,0.5584191799163818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,1,8,power_law_1.01,0.25077118873596194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,1,8,power_law_1.2,0.13898240327835082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,4,2,power_law_1.2,0.6577536106109619
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,1,8,power_law_1.01,0.25363199710845946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,1,8,power_law_1.2,0.1221824049949646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,4,2,power_law_1.2,0.8396160125732421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,1,8,power_law_1.01,0.264684796333313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,1,8,power_law_1.2,0.09004799723625183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,4,2,power_law_1.2,1.0042624473571777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,1,8,power_law_1.01,0.29356799125671384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,1,8,power_law_1.2,0.12405120134353638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,4,2,power_law_1.2,1.5379648208618164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,1,8,power_law_1.01,0.30456318855285647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,1,8,power_law_1.2,0.1441151976585388
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,4,2,power_law_1.2,2.0153663635253904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,1,8,power_law_1.01,0.3531584024429321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,1,8,power_law_1.2,0.15762560367584227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,4,2,power_law_1.2,2.362495994567871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,1,8,power_law_1.01,0.41768321990966795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,1,8,power_law_1.2,0.1907904028892517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,4,2,power_law_1.2,3.4442367553710938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,1,8,power_law_1.01,0.5075456142425537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,1,8,power_law_1.2,0.2024768114089966
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,4,2,power_law_1.2,7.456249237060547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,1,8,power_law_1.01,0.5251967906951904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,1,8,power_law_1.2,0.21333119869232178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,1,8,power_law_1.2,0.21067519187927247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,1,8,power_law_1.01,0.6589375972747803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,1,8,power_law_1.2,0.22274560928344728
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,1,8,power_law_1.01,0.8043328285217285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,1,8,power_law_1.2,0.23299839496612548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,1,8,power_law_1.01,1.0765055656433105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,1,8,power_law_1.2,0.2309312105178833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,1,8,power_law_1.01,1.3980607986450195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,2,4,power_law_1.01,0.08369280099868774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,1,8,power_law_1.2,0.24486401081085205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,1,8,power_law_1.01,1.6968448638916016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,2,4,power_law_1.01,0.11276160478591919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,1,8,power_law_1.2,0.24834558963775635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,1,8,power_law_1.01,2.528940773010254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,2,4,power_law_1.01,0.1580288052558899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,1,8,power_law_1.2,0.26863999366760255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,2,4,power_law_1.01,0.10601600408554077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,1,8,power_law_1.2,0.28910079002380373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,1,8,power_law_1.01,4.701785659790039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,2,4,power_law_1.01,0.12629760503768922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,1,8,power_law_1.2,0.3083584070205688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,2,4,power_law_1.01,0.16561919450759888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,1,8,power_law_1.2,0.3739007949829102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,2,4,power_law_1.01,0.18793599605560302
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,1,8,power_law_1.2,0.4001023769378662
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,2,4,power_law_1.01,0.22602241039276122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,1,8,power_law_1.2,0.48592000007629393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,2,4,power_law_1.01,0.24014720916748047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,1,8,power_law_1.2,0.5600575923919677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,2,4,power_law_1.2,0.08405759930610657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,2,4,power_law_1.01,0.25306239128112795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,1,8,power_law_1.2,0.732697582244873
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,2,4,power_law_1.2,0.11519360542297363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,2,4,power_law_1.01,0.24895999431610108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,1,8,power_law_1.2,0.8985983848571777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,2,4,power_law_1.2,0.11185920238494873
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,2,4,power_law_1.01,0.2751807928085327
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,2,4,power_law_1.2,0.10208640098571778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,1,8,power_law_1.2,1.262118434906006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,2,4,power_law_1.01,0.2772543907165527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,2,4,power_law_1.2,0.12602880001068115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,1,8,power_law_1.2,1.574028778076172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,2,4,power_law_1.01,0.27435519695281985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,2,4,power_law_1.2,0.15758719444274902
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,1,8,power_law_1.2,1.8853248596191405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,2,4,power_law_1.01,0.28664960861206057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,2,4,power_law_1.2,0.17786240577697754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,1,8,power_law_1.2,2.798534393310547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,2,4,power_law_1.01,0.2995392084121704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,2,4,power_law_1.2,0.22087039947509765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,2,4,power_law_1.01,0.30755200386047366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,2,4,power_law_1.2,0.22926080226898193
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,1,8,power_law_1.2,5.846361541748047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,2,4,power_law_1.01,0.34481918811798096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,2,4,power_law_1.2,0.2440256118774414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,2,4,power_law_1.01,0.36694400310516356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,2,4,power_law_1.2,0.24216959476470948
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,2,4,power_law_1.01,0.42734718322753906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,2,4,power_law_1.2,0.2538367986679077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,2,4,power_law_1.01,0.4683135986328125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,2,4,power_law_1.2,0.27165439128875735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,2,4,power_law_1.01,0.574399995803833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,2,4,power_law_1.2,0.27820799350738523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,2,4,power_law_1.01,0.6296832084655761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,2,4,power_law_1.2,0.2827136039733887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,4,2,power_law_1.01,0.08717439770698547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,2,4,power_law_1.01,0.7756991863250733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,2,4,power_law_1.2,0.30135679244995117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,4,2,power_law_1.01,0.10046720504760742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,2,4,power_law_1.01,0.9575743675231934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,2,4,power_law_1.2,0.30624639987945557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,4,2,power_law_1.01,0.14042240381240845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,2,4,power_law_1.2,0.3523519992828369
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,2,4,power_law_1.01,1.3096192359924317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,4,2,power_law_1.01,0.1205631971359253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,2,4,power_law_1.2,0.39241600036621094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,2,4,power_law_1.01,1.5764736175537108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,4,2,power_law_1.01,0.16745599508285522
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,2,4,power_law_1.2,0.43466877937316895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,2,4,power_law_1.01,1.9969087600708009
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,4,2,power_law_1.01,0.218451189994812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,2,4,power_law_1.2,0.476032018661499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,2,4,power_law_1.01,3.149760055541992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,4,2,power_law_1.01,0.2430272102355957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,2,4,power_law_1.2,0.6283904075622558
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,4,2,power_law_1.01,0.2882879972457886
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,2,4,power_law_1.2,0.6634431838989258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,2,4,power_law_1.01,5.492051315307617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,4,2,power_law_1.01,0.30180480480194094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,2,4,power_law_1.2,0.8293120384216308
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,4,2,power_law_1.01,0.3179840087890625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,2,4,power_law_1.2,1.0202048301696778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,4,2,power_law_1.01,0.33130879402160646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,2,4,power_law_1.2,1.3468607902526855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,4,2,power_law_1.01,0.34686079025268557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,2,4,power_law_1.2,1.6825088500976562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,4,2,power_law_1.01,0.3546432018280029
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,4,2,power_law_1.01,0.3615936040878296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,2,4,power_law_1.2,2.0484287261962892
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,4,2,power_law_1.2,0.09126399755477906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,4,2,power_law_1.01,0.36528639793395995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,2,4,power_law_1.2,3.1150848388671877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,4,2,power_law_1.2,0.10253440141677857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,4,2,power_law_1.01,0.3892607927322388
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,4,2,power_law_1.2,0.10725760459899902
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,4,2,power_law_1.01,0.40830721855163576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,2,4,power_law_1.2,6.536255645751953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,4,2,power_law_1.2,0.12075519561767578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,4,2,power_law_1.01,0.4576704025268555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,4,2,power_law_1.2,0.1546880006790161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,4,2,power_law_1.01,0.4871551990509033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,4,2,power_law_1.2,0.2006335973739624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,4,2,power_law_1.01,0.5678463935852051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,4,2,power_law_1.2,0.21906559467315673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,4,2,power_law_1.01,0.6372672080993652
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,4,2,power_law_1.2,0.29402239322662355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,4,2,power_law_1.01,0.769977617263794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,4,2,power_law_1.2,0.30220799446105956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,4,2,power_law_1.01,0.8451519966125488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,4,2,power_law_1.2,0.3042623996734619
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,4,2,power_law_1.01,1.1113856315612793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,4,2,power_law_1.2,0.11845120191574096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,4,2,power_law_1.2,0.33703041076660156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,4,2,power_law_1.01,1.293241596221924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,4,2,power_law_1.2,0.12337280511856079
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,8,1,power_law_1.01,0.10840320587158203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,4,2,power_law_1.2,0.3333247900009155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,4,2,power_law_1.01,1.7739072799682618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,4,2,power_law_1.2,0.12461440563201905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,8,1,power_law_1.01,0.11887999773025512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,4,2,power_law_1.2,0.3603519916534424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,4,2,power_law_1.2,0.1376960039138794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,4,2,power_law_1.01,2.2197568893432615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,8,1,power_law_1.01,0.13813120126724243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,4,2,power_law_1.2,0.3574975967407227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,4,2,power_law_1.2,0.13216639757156373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,4,2,power_law_1.01,2.6557823181152345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,8,1,power_law_1.01,0.16656639575958251
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,4,2,power_law_1.2,0.3763520002365112
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,4,2,power_law_1.2,0.13443200588226317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,4,2,power_law_1.2,0.1481152057647705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,8,1,power_law_1.01,0.23990399837493898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,4,2,power_law_1.01,3.9871871948242186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,4,2,power_law_1.2,0.3929343938827515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,4,2,power_law_1.2,0.1471295952796936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,4,2,power_law_1.2,0.4210048198699951
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,8,1,power_law_1.01,0.295411205291748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,4,2,power_law_1.01,7.627097320556641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,4,2,power_law_1.2,0.14549119472503663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,8,1,power_law_1.01,0.34967041015625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,4,2,power_law_1.2,0.4592832088470459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,4,2,power_law_1.2,0.18193279504776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,8,1,power_law_1.01,0.43016958236694336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,4,2,power_law_1.2,0.4961535930633545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,4,2,power_law_1.2,0.2110208034515381
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,8,1,power_law_1.01,0.4395967960357666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,4,2,power_law_1.2,0.5682432174682617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,4,2,power_law_1.2,0.25661439895629884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,4,2,power_law_1.2,0.33103361129760744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,8,1,power_law_1.01,0.4588160037994385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,4,2,power_law_1.2,0.6548672199249268
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,4,2,power_law_1.2,0.4436863899230957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,8,1,power_law_1.01,0.4993599891662598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,4,2,power_law_1.2,0.7847104072570801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,4,2,power_law_1.2,0.5329728126525879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,8,1,power_law_1.01,0.5153600215911865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,4,2,power_law_1.2,0.8834303855895996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,4,2,power_law_1.2,0.7736127853393555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,8,1,power_law_1.01,0.5235648155212402
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,4,2,power_law_1.2,1.1031935691833497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,4,2,power_law_1.2,1.0537664413452148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,8,1,power_law_1.01,0.5325632095336914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,4,2,power_law_1.2,1.2924160003662108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,4,2,power_law_1.2,1.4217727661132813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,8,1,power_law_1.2,0.10971519947052003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,8,1,power_law_1.01,0.5518271923065186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,4,2,power_law_1.2,1.8161088943481445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,4,2,power_law_1.2,1.9190528869628907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,8,1,power_law_1.2,0.11747839450836181
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,8,1,power_law_1.01,0.5600063800811768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,4,2,power_law_1.2,2.3330175399780275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,4,2,power_law_1.2,2.4406911849975588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,8,1,power_law_1.2,0.1305791974067688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,8,1,power_law_1.01,0.596454381942749
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,4,2,power_law_1.2,2.7747583389282227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,4,2,power_law_1.2,4.043865585327149
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,8,1,power_law_1.2,0.16090879440307618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,8,1,power_law_1.01,0.6712192058563232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,4,2,power_law_1.2,4.055782318115234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,8,1,power_law_1.2,0.22438399791717528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,8,1,power_law_1.01,0.7277440071105957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,4,2,power_law_1.2,7.94295654296875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,8,1,power_law_1.2,0.2731328010559082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,8,1,power_law_1.01,0.8645376205444336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,4,2,power_law_1.2,7.976614379882813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,8,1,power_law_1.2,0.31111679077148435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,8,1,power_law_1.01,0.9481023788452149
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,8,1,power_law_1.2,0.410752010345459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,8,1,power_law_1.01,1.171884822845459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,8,1,power_law_1.2,0.42897920608520507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,8,1,power_law_1.01,1.3406399726867675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,8,1,power_law_1.2,0.4506944179534912
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,8,1,power_law_1.01,1.7177536010742187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,8,1,power_law_1.2,0.4556159973144531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,8,1,power_law_1.01,1.9878656387329101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,8,1,power_law_1.2,0.4994495868682861
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,8,1,power_law_1.01,2.715123176574707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,8,1,power_law_1.2,0.5096896171569825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,8,1,power_law_1.01,3.4396095275878906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,8,1,power_law_1.2,0.5174464225769043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,8,1,power_law_1.01,4.150348663330078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,8,1,power_law_1.2,0.5453184127807618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,8,1,power_law_1.2,0.5522304058074952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,8,1,power_law_1.01,6.273100662231445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,8,1,power_law_1.2,0.6022528171539306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,8,1,power_law_1.01,12.075494384765625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,8,1,power_law_1.2,0.6929791927337646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,8,1,power_law_1.2,0.7400896072387695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,8,1,power_law_1.2,0.8730943679809571
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,8,1,power_law_1.2,0.9489791870117188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,8,1,power_law_1.2,1.1720128059387207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,8,1,power_law_1.2,1.3280575752258301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,8,1,power_law_1.2,1.7132415771484375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,8,1,power_law_1.2,2.077631950378418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,8,1,power_law_1.2,2.7595136642456053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,8,1,power_law_1.2,3.4512256622314452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,8,1,power_law_1.2,4.171308898925782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,8,1,power_law_1.2,6.296915054321289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,8,1,power_law_1.2,12.188947296142578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,8,power_law_1.01,0.05988479852676391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,8,power_law_1.01,0.06479359865188598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,8,power_law_1.01,0.06110720038414001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,8,power_law_1.2,0.061375999450683595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,8,power_law_1.01,0.06110720038414001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,8,power_law_1.2,0.07242879867553711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,8,power_law_1.01,0.06214399933815003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,8,power_law_1.2,0.06259840130805969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,8,power_law_1.01,0.06725119948387145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,8,power_law_1.2,0.06219519972801209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,8,power_law_1.01,0.06807039976119995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,8,power_law_1.2,0.06177279949188232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,8,power_law_1.01,0.07278079986572265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,8,power_law_1.2,0.06833919882774353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,8,power_law_1.01,0.07749760150909424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,8,power_law_1.2,0.06997119784355163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,8,power_law_1.2,0.07365760207176208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,8,power_law_1.01,0.0832319974899292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,8,power_law_1.2,0.08961920142173767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,8,power_law_1.01,0.09879040122032165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,8,power_law_1.2,0.08717439770698547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,8,power_law_1.01,0.11947519779205322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,8,power_law_1.2,0.070796799659729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,8,power_law_1.01,0.1366719961166382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,8,power_law_1.2,0.08060799837112427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,8,power_law_1.01,0.09059839844703674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,8,power_law_1.2,0.08266879916191101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,8,power_law_1.01,0.10577280521392822
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,8,power_law_1.2,0.09044479727745056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,8,power_law_1.01,0.11352959871292115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,8,power_law_1.2,0.11176960468292237
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,8,power_law_1.01,0.12092159986495972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,8,power_law_1.2,0.11358720064163208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,8,power_law_1.01,0.15960320234298705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,4,power_law_1.01,0.059487998485565186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,8,power_law_1.2,0.12239999771118164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,8,power_law_1.01,0.17477760314941407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,4,power_law_1.01,0.05559679865837097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,8,power_law_1.2,0.17093119621276856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,8,power_law_1.01,0.239084792137146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,4,power_law_1.01,0.06133120059967041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,8,power_law_1.2,0.17748479843139647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,8,power_law_1.01,0.33408639430999754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,4,power_law_1.01,0.06092159748077393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,8,power_law_1.2,0.25326080322265626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,8,power_law_1.01,0.48586239814758303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,4,power_law_1.01,0.061536002159118655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,8,power_law_1.2,0.3083584070205688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,8,power_law_1.01,0.5464831829071045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,4,power_law_1.01,0.06603519916534424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,8,power_law_1.2,0.4400383949279785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,8,power_law_1.01,0.8674112319946289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,4,power_law_1.01,0.0680895984172821
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,8,power_law_1.2,0.5932352066040039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,8,power_law_1.01,1.0410688400268555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,4,power_law_1.01,0.07155200242996215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,8,power_law_1.2,0.7900415897369385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,8,power_law_1.01,1.678816032409668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,4,power_law_1.01,0.07259520292282104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,8,power_law_1.2,1.0921216011047363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,8,power_law_1.01,2.1447423934936523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,4,power_law_1.01,0.07504640221595764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,8,power_law_1.2,1.7906879425048827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,4,power_law_1.01,0.07136639952659607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,8,power_law_1.01,3.076140785217285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,8,power_law_1.2,2.4333568572998048
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,4,power_law_1.01,0.07279360294342041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,8,power_law_1.01,4.574073410034179
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,8,power_law_1.2,2.9435199737548827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,4,power_law_1.01,0.07464320063591004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,4,power_law_1.01,0.08242560029029847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,8,power_law_1.2,4.980172729492187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,8,power_law_1.01,9.591667175292969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,4,power_law_1.01,0.08937600255012512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,8,power_law_1.2,10.341926574707031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,4,power_law_1.01,0.09082239866256714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,4,power_law_1.01,0.10044159889221191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,4,power_law_1.01,0.12338559627532959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,4,power_law_1.01,0.1590208053588867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,4,power_law_1.2,0.06136959791183472
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,4,power_law_1.01,0.17905280590057374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,4,power_law_1.2,0.06280959844589233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,4,power_law_1.01,0.21430399417877197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,4,power_law_1.2,0.0605567991733551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,4,power_law_1.01,0.37569279670715333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,4,power_law_1.2,0.060134398937225345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,4,power_law_1.01,0.45392642021179197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,4,power_law_1.2,0.06117759943008423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,4,power_law_1.01,0.7924672126770019
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,4,power_law_1.2,0.06506239771842956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,4,power_law_1.01,0.9030591964721679
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,4,power_law_1.2,0.06772480010986329
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,4,power_law_1.01,1.1957183837890626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,4,power_law_1.2,0.06915839910507202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,4,power_law_1.2,0.06997759938240052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,4,power_law_1.01,2.0161344528198244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,4,power_law_1.2,0.07079039812088013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,4,power_law_1.01,1.7644479751586915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,4,power_law_1.2,0.070387202501297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,4,power_law_1.01,3.200896072387695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,4,power_law_1.2,0.07119359970092773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,4,power_law_1.01,6.868447875976562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,4,power_law_1.2,0.07121279835700989
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,4,power_law_1.2,0.0810368001461029
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,4,power_law_1.2,0.08921599984169007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,4,power_law_1.2,0.0896448016166687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,4,power_law_1.2,0.10622719526290894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,4,power_law_1.2,0.13879679441452025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,4,power_law_1.2,0.1535423994064331
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,4,power_law_1.2,0.21476480960845948
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,4,power_law_1.2,0.23401598930358886
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,4,power_law_1.2,0.3299839973449707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,4,power_law_1.2,0.47282562255859373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,4,power_law_1.2,0.6712768077850342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,4,power_law_1.2,1.01527681350708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,4,power_law_1.2,1.289568042755127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,4,power_law_1.2,1.957209587097168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,4,power_law_1.2,2.646777534484863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,4,power_law_1.2,3.2972030639648438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,4,power_law_1.2,8.410591888427735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,2,power_law_1.01,0.048819199204444885
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,2,power_law_1.01,0.04614399969577789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,2,power_law_1.2,0.0470335990190506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,2,power_law_1.01,0.049446401000022885
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,2,power_law_1.2,0.04867840111255646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,2,power_law_1.01,0.0602944016456604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,2,power_law_1.2,0.049491199851036075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,2,power_law_1.01,0.06111360192298889
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,2,power_law_1.2,0.06219519972801209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,2,power_law_1.01,0.06439039707183838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,2,power_law_1.2,0.05850239992141724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,2,power_law_1.01,0.07011839747428894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,2,power_law_1.2,0.06053119897842407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,2,power_law_1.01,0.06336640119552613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,2,power_law_1.2,0.06096000075340271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,2,power_law_1.01,0.06312959790229797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,2,power_law_1.2,0.06116480231285095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,2,power_law_1.01,0.06664959788322448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,2,power_law_1.2,0.06689919829368592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,2,power_law_1.01,0.06726400256156921
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,2,power_law_1.2,0.06625919938087463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,2,power_law_1.01,0.06807039976119995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,2,power_law_1.2,0.06586880087852479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,2,power_law_1.01,0.07094399929046631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,2,power_law_1.2,0.06669440269470214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,2,power_law_1.01,0.06929280161857605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,2,power_law_1.2,0.06710399985313416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,2,power_law_1.01,0.08343679904937744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,2,power_law_1.2,0.07078400254249573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,2,power_law_1.01,0.0832319974899292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,2,power_law_1.2,0.08636159896850586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,2,power_law_1.01,0.0930624008178711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,2,power_law_1.2,0.08776320219039917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,2,power_law_1.01,0.10678399801254272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,1,power_law_1.01,0.04391680061817169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,2,power_law_1.2,0.09536640048027038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,2,power_law_1.01,0.11518080234527588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,1,power_law_1.01,0.041875201463699344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,2,power_law_1.2,0.11809279918670654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,2,power_law_1.01,0.15367679595947265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,1,power_law_1.01,0.04679040014743805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,2,power_law_1.2,0.12097920179367065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,2,power_law_1.01,0.18154239654541016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,1,power_law_1.01,0.058457601070404056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,2,power_law_1.2,0.15557119846343995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,2,power_law_1.01,0.23415679931640626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,1,power_law_1.01,0.05559679865837097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,2,power_law_1.2,0.19325439929962157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,2,power_law_1.01,0.2976639986038208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,1,power_law_1.01,0.0621504008769989
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,2,power_law_1.2,0.23114240169525146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,2,power_law_1.01,0.4293375968933105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,1,power_law_1.01,0.06234880089759827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,2,power_law_1.2,0.30589439868927004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,2,power_law_1.01,0.585811185836792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,1,power_law_1.01,0.06481279730796814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,2,power_law_1.2,0.46051840782165526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,2,power_law_1.01,0.7146175861358642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,1,power_law_1.01,0.065830397605896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,2,power_law_1.2,0.4793600082397461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,1,power_law_1.01,0.0676800012588501
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,2,power_law_1.01,1.161292839050293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,2,power_law_1.2,0.8592767715454102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,1,power_law_1.01,0.06378880143165588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,2,power_law_1.01,1.3673088073730468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,2,power_law_1.2,1.0970303535461425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,1,power_law_1.01,0.06870399713516236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,2,power_law_1.01,2.4193727493286135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,2,power_law_1.2,1.5834367752075196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,1,power_law_1.01,0.07379199862480164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,2,power_law_1.2,2.259891128540039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,2,power_law_1.01,3.584889602661133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,1,power_law_1.01,0.06973440051078797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,1,power_law_1.01,0.0834496021270752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,2,power_law_1.2,4.508185577392578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,1,power_law_1.01,0.08570240139961242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,1,power_law_1.2,0.03475199937820435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,1,power_law_1.01,0.08529279828071594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,1,power_law_1.2,0.04519680142402649
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,1,power_law_1.01,0.10165760517120362
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,1,power_law_1.2,0.04519680142402649
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,1,power_law_1.01,0.11025919914245605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,1,power_law_1.2,0.055238401889801024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,1,power_law_1.01,0.13362560272216797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,1,power_law_1.2,0.05708799958229065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,1,power_law_1.01,0.15880320072174073
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,1,power_law_1.2,0.058911997079849246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,1,power_law_1.01,0.20364799499511718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,1,power_law_1.2,0.05931519865989685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,1,power_law_1.01,0.25178239345550535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,1,power_law_1.2,0.06097279787063599
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,1,power_law_1.01,0.3404736042022705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,1,power_law_1.2,0.06669440269470214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,1,power_law_1.01,0.4416384220123291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,1,power_law_1.2,0.07018240094184876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,1,power_law_1.01,0.6337408065795899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,1,power_law_1.2,0.0677183985710144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,1,power_law_1.01,0.8330047607421875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,1,power_law_1.2,0.07346559762954712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,1,power_law_1.01,1.032902431488037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,1,power_law_1.2,0.07306240200996399
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,1,power_law_1.01,1.6186304092407227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,1,power_law_1.2,0.06915199756622314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,1,power_law_1.01,3.30371208190918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,1,power_law_1.2,0.08144639730453491
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,1,power_law_1.2,0.08471680283546448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,1,power_law_1.2,0.08451840281486511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,1,power_law_1.2,0.10151040554046631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,1,power_law_1.2,0.11094399690628051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,1,power_law_1.2,0.13264000415802002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,1,power_law_1.2,0.1547711968421936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,1,power_law_1.2,0.20346879959106445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,1,power_law_1.2,0.2512255907058716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,1,power_law_1.2,0.33948800563812254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,1,power_law_1.2,0.4425151824951172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,1,power_law_1.2,0.6364480018615722
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,1,power_law_1.2,0.8363455772399903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,1,power_law_1.2,1.0488575935363769
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,1,power_law_1.2,1.7149375915527343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,1,power_law_1.2,3.3721729278564454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,8,power_law_1.01,0.0844543993473053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,8,power_law_1.01,0.09675520062446594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,8,power_law_1.01,0.08364800214767457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,8,power_law_1.2,0.0859391987323761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,8,power_law_1.01,0.0832319974899292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,8,power_law_1.2,0.09639040231704712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,8,power_law_1.01,0.08321920037269592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,8,power_law_1.2,0.08409600257873535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,8,power_law_1.01,0.09838079810142517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,8,power_law_1.2,0.08288000226020813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,8,power_law_1.01,0.10903680324554443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,8,power_law_1.2,0.084307199716568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,8,power_law_1.01,0.09039360284805298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,8,power_law_1.2,0.10027519464492798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,8,power_law_1.2,0.10006400346755981
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,8,power_law_1.01,0.09879680275917054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,8,power_law_1.2,0.08963840007781983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,8,power_law_1.01,0.09633280038833618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,8,power_law_1.2,0.09618560075759888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,8,power_law_1.01,0.09961599707603455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,8,power_law_1.2,0.09884160161018371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,8,power_law_1.01,0.10657919645309448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,8,power_law_1.2,0.09720320105552674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,8,power_law_1.01,0.11251200437545776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,8,power_law_1.2,0.11113599538803101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,8,power_law_1.01,0.13483519554138185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,8,power_law_1.2,0.11337599754333497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,8,power_law_1.01,0.156550395488739
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,8,power_law_1.2,0.12240639925003052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,8,power_law_1.01,0.18234879970550538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,8,power_law_1.2,0.1351040005683899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,4,power_law_1.01,0.08240640163421631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,8,power_law_1.01,0.17765120267868043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,8,power_law_1.2,0.13693439960479736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,4,power_law_1.01,0.08570240139961242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,8,power_law_1.01,0.23928320407867432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,8,power_law_1.2,0.18424960374832153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,4,power_law_1.01,0.07585920095443725
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,8,power_law_1.01,0.23928320407867432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,8,power_law_1.2,0.2420032024383545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,4,power_law_1.01,0.08181120157241821
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,8,power_law_1.01,0.3556096076965332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,8,power_law_1.2,0.23585920333862304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,4,power_law_1.01,0.08119040131568908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,8,power_law_1.01,0.4551487922668457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,8,power_law_1.2,0.3657151937484741
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,4,power_law_1.01,0.08241279721260071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,8,power_law_1.01,0.6814527988433838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,8,power_law_1.2,0.48714241981506345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,4,power_law_1.01,0.08774399757385254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,8,power_law_1.01,0.7547840118408203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,4,power_law_1.01,0.0893887996673584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,8,power_law_1.2,0.7089471817016602
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,8,power_law_1.01,1.453343963623047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,4,power_law_1.01,0.0889792025089264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,8,power_law_1.2,0.9022656440734863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,8,power_law_1.01,1.6829120635986328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,4,power_law_1.01,0.0889792025089264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,8,power_law_1.2,1.454201602935791
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,8,power_law_1.01,2.7681535720825194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,4,power_law_1.01,0.09264000058174134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,8,power_law_1.2,1.8087167739868164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,4,power_law_1.01,0.09594240188598632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,8,power_law_1.01,3.8261375427246094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,8,power_law_1.2,2.787455940246582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,4,power_law_1.01,0.10022399425506592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,8,power_law_1.01,4.765766525268555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,8,power_law_1.2,3.722137451171875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,4,power_law_1.01,0.11007360219955445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,4,power_law_1.2,0.0775551974773407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,8,power_law_1.2,4.974924850463867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,4,power_law_1.01,0.11642240285873413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,8,power_law_1.01,7.897586822509766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,4,power_law_1.2,0.06956160068511963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,4,power_law_1.01,0.12051199674606324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,4,power_law_1.2,0.07775359749794006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,8,power_law_1.2,8.253791809082031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,8,power_law_1.01,17.873202514648437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,4,power_law_1.01,0.14488960504531861
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,4,power_law_1.2,0.08164479732513427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,4,power_law_1.01,0.18421119451522827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,4,power_law_1.2,0.08083840012550354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,8,power_law_1.2,15.892845153808594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,4,power_law_1.01,0.20448639392852783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,4,power_law_1.2,0.08247039914131164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,4,power_law_1.01,0.25383040904998777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,4,power_law_1.2,0.08328959941864014
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,4,power_law_1.01,0.35399041175842283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,4,power_law_1.2,0.08737919926643371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,4,power_law_1.01,0.5591872215270997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,4,power_law_1.2,0.08921599984169007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,4,power_law_1.2,0.09045119881629944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,4,power_law_1.01,0.6880064010620117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,4,power_law_1.2,0.09148160219192505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,4,power_law_1.01,0.9747136116027832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,4,power_law_1.2,0.096806401014328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,4,power_law_1.01,1.334560012817383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,4,power_law_1.2,0.10050560235977173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,4,power_law_1.01,2.089459228515625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,4,power_law_1.2,0.10294400453567505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,4,power_law_1.01,2.9885183334350587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,4,power_law_1.2,0.12055679559707641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,4,power_law_1.01,3.632012939453125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,4,power_law_1.2,0.1314239978790283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,4,power_law_1.2,0.1469823956489563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,4,power_law_1.01,7.345849609375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,4,power_law_1.2,0.17933440208435059
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,4,power_law_1.01,12.676588439941407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,4,power_law_1.2,0.21169281005859375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,4,power_law_1.2,0.29811840057373046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,4,power_law_1.2,0.3814079999923706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,4,power_law_1.2,0.589958381652832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,4,power_law_1.2,0.7302527904510498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,4,power_law_1.2,1.131430435180664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,4,power_law_1.2,1.251039981842041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,4,power_law_1.2,2.150060844421387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,4,power_law_1.2,2.544300842285156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,4,power_law_1.2,3.8884735107421875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,4,power_law_1.2,8.21193618774414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,4,power_law_1.2,13.969952392578126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,2,power_law_1.01,0.05742719769477844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,2,power_law_1.01,0.0725823998451233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,2,power_law_1.01,0.07340160012245178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,2,power_law_1.2,0.0574783980846405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,2,power_law_1.01,0.07626879811286927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,2,power_law_1.2,0.055232000350952146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,2,power_law_1.01,0.077920001745224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,2,power_law_1.2,0.07343999743461609
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,2,power_law_1.01,0.0815936028957367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,2,power_law_1.2,0.07775359749794006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,2,power_law_1.2,0.07693439722061157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,2,power_law_1.01,0.08650239706039428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,2,power_law_1.2,0.08184319734573364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,2,power_law_1.01,0.08753920197486878
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,2,power_law_1.2,0.08123520016670227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,2,power_law_1.01,0.09060479998588562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,2,power_law_1.2,0.08267520070075988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,2,power_law_1.01,0.09102079868316651
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,2,power_law_1.2,0.08553599715232849
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,2,power_law_1.01,0.09162880182266235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,2,power_law_1.2,0.08717439770698547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,2,power_law_1.01,0.09203839898109437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,2,power_law_1.2,0.0908415973186493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,2,power_law_1.01,0.0934719979763031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,2,power_law_1.2,0.09106559753417968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,2,power_law_1.01,0.10412800312042236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,2,power_law_1.2,0.09249920248985291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,2,power_law_1.01,0.11292159557342529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,2,power_law_1.2,0.10458240509033204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,2,power_law_1.01,0.11169279813766479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,2,power_law_1.2,0.11338880062103271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,1,power_law_1.01,0.04390400052070618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,2,power_law_1.01,0.1377087950706482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,2,power_law_1.2,0.11666560173034668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,1,power_law_1.01,0.050886398553848265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,2,power_law_1.01,0.14650880098342894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,2,power_law_1.2,0.14595839977264405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,1,power_law_1.01,0.05907840132713318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,2,power_law_1.01,0.17169920206069947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,2,power_law_1.2,0.15352319478988646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,1,power_law_1.01,0.0791487991809845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,2,power_law_1.01,0.2134848117828369
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,2,power_law_1.2,0.18465919494628907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,1,power_law_1.01,0.08099200129508972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,2,power_law_1.01,0.2558464050292969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,2,power_law_1.2,0.2129215955734253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,1,power_law_1.01,0.0807807981967926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,2,power_law_1.01,0.36074879169464114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,2,power_law_1.2,0.2581952095031738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,1,power_law_1.01,0.08057600259780884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,2,power_law_1.01,0.47479681968688964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,2,power_law_1.2,0.36548480987548826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,1,power_law_1.01,0.08242560029029847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,2,power_law_1.01,0.6716224193572998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,2,power_law_1.2,0.4912384033203125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,1,power_law_1.01,0.08979840278625488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,2,power_law_1.2,0.6087615966796875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,1,power_law_1.01,0.0902079999446869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,2,power_law_1.2,0.8609087944030762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,1,power_law_1.01,0.08734080195426941
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,1,power_law_1.01,0.09122560024261475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,2,power_law_1.2,1.3214912414550781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,1,power_law_1.2,0.04416640102863312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,1,power_law_1.01,0.09470720291137695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,1,power_law_1.2,0.04867199957370758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,2,power_law_1.2,1.6698688507080077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,1,power_law_1.01,0.09696639776229858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,1,power_law_1.2,0.05687040090560913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,2,power_law_1.2,2.180428886413574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,1,power_law_1.01,0.11314560174942016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,1,power_law_1.2,0.07918720245361328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,2,power_law_1.2,4.0463615417480465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,1,power_law_1.01,0.11252479553222657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,1,power_law_1.2,0.07857279777526856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,1,power_law_1.01,0.12093440294265748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,1,power_law_1.2,0.07959679961204529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,2,power_law_1.2,7.774739074707031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,1,power_law_1.01,0.15329279899597167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,1,power_law_1.2,0.082259202003479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,1,power_law_1.01,0.16309759616851807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,1,power_law_1.2,0.08144639730453491
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,1,power_law_1.01,0.18952959775924683
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,1,power_law_1.2,0.08142719864845276
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,1,power_law_1.01,0.22187519073486328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,1,power_law_1.2,0.0830784022808075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,1,power_law_1.01,0.2984960079193115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,1,power_law_1.2,0.09044479727745056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,1,power_law_1.01,0.3574592113494873
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,1,power_law_1.2,0.0933247983455658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,1,power_law_1.01,0.5051199913024902
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,1,power_law_1.2,0.09393919706344604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,1,power_law_1.01,0.6724287986755371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,1,power_law_1.2,0.09886080026626587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,1,power_law_1.01,0.9886655807495117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,1,power_law_1.2,0.11134719848632812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,1,power_law_1.2,0.1121664047241211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,1,power_law_1.01,1.246016025543213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,1,power_law_1.2,0.12323839664459228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,1,power_law_1.01,1.5858367919921874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,1,power_law_1.2,0.15210239887237548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,1,power_law_1.01,2.5414144515991213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,1,power_law_1.2,0.16336640119552612
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,1,power_law_1.01,5.115385437011719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,1,power_law_1.2,0.18424960374832153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,1,power_law_1.2,0.22194559574127198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,1,power_law_1.2,0.3013760089874268
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,1,power_law_1.2,0.35793280601501465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,1,power_law_1.2,0.5100863933563232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,1,power_law_1.2,0.6707776069641114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,1,power_law_1.2,0.9952704429626464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,1,power_law_1.2,1.278508758544922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,1,power_law_1.2,1.6104896545410157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,1,power_law_1.2,2.5774911880493163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,1,power_law_1.2,5.197760009765625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,16,power_law_1.01,0.1580288052558899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,16,power_law_1.01,0.2741568088531494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,16,power_law_1.01,0.16165119409561157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,16,power_law_1.01,0.11543680429458618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,16,power_law_1.01,0.1596735954284668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,16,power_law_1.01,0.1842560052871704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,16,power_law_1.01,0.2196863889694214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,16,power_law_1.01,0.21263360977172852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,16,power_law_1.01,0.23401598930358886
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,16,power_law_1.01,0.23075199127197266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,16,power_law_1.01,0.2282815933227539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,16,power_law_1.01,0.2336064100265503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,16,power_law_1.2,0.16147840023040771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,16,power_law_1.01,0.23095040321350097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,16,power_law_1.2,0.28781440258026125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,16,power_law_1.01,0.24793601036071777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,16,power_law_1.2,0.09778559803962708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,16,power_law_1.01,0.24131839275360106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,16,power_law_1.2,0.11683199405670167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,16,power_law_1.2,0.14058879613876343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,16,power_law_1.2,0.1503424048423767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,16,power_law_1.2,0.20858240127563477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,16,power_law_1.2,0.21349120140075684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,16,power_law_1.2,0.22025599479675292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,8,power_law_1.01,0.10888960361480712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,16,power_law_1.2,0.22291839122772217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,8,power_law_1.01,0.16459519863128663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,16,power_law_1.2,0.23725440502166747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,8,power_law_1.01,0.10643199682235718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,16,power_law_1.2,0.2395008087158203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,8,power_law_1.01,0.09782400131225585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,16,power_law_1.2,0.23539199829101562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,8,power_law_1.01,0.13530880212783813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,16,power_law_1.2,0.23909120559692382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,8,power_law_1.01,0.14780160188674926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,16,power_law_1.2,0.2542527914047241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,8,power_law_1.01,0.21846399307250977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,16,power_law_1.2,0.27124478816986086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,8,power_law_1.01,0.2190783977508545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,16,power_law_1.2,0.27473280429840086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,8,power_law_1.01,0.21824638843536376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,16,power_law_1.2,0.3136447906494141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,8,power_law_1.01,0.22174079418182374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,16,power_law_1.2,0.33680000305175783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,8,power_law_1.01,0.23256959915161132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,16,power_law_1.2,0.40497279167175293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,8,power_law_1.01,0.23280000686645508
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,16,power_law_1.2,0.41665282249450686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,8,power_law_1.01,0.2336127996444702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,16,power_law_1.2,0.5682112216949463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,8,power_law_1.01,0.24955520629882813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,16,power_law_1.2,0.5895103931427002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,8,power_law_1.01,0.26248319149017335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,16,power_law_1.2,0.7744448184967041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,8,power_law_1.01,0.26883199214935305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,16,power_law_1.2,1.1027327537536622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,8,power_law_1.01,0.26576640605926516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,16,power_law_1.2,1.710380744934082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,8,power_law_1.01,0.28993279933929444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,16,power_law_1.2,1.9841791152954102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,8,power_law_1.01,0.3077631950378418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,16,power_law_1.2,2.084550476074219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,8,power_law_1.01,0.3652928113937378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,8,power_law_1.01,0.3708159923553467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,16,power_law_1.2,4.016364669799804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,8,power_law_1.01,0.45888638496398926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,8,power_law_1.01,0.5485951900482178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,16,power_law_1.2,13.3134521484375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,8,power_law_1.01,0.6987135887145997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,8,power_law_1.01,0.9006527900695801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,8,power_law_1.01,1.1216383934020997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,8,power_law_1.01,1.549452781677246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,8,power_law_1.01,1.816908836364746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,8,power_law_1.01,2.8702144622802734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,8,power_law_1.01,5.6728767395019535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,2,power_law_1.01,0.6675327777862549
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,2,power_law_1.01,1.1920127868652344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,2,power_law_1.01,1.827507209777832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,2,power_law_1.01,2.2729536056518556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,2,power_law_1.01,3.397510528564453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,2,power_law_1.01,7.693817901611328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,8,power_law_1.2,0.11068799495697021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,8,power_law_1.2,0.20448000431060792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,8,power_law_1.2,0.08201599717140198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,8,power_law_1.2,0.10454399585723877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,8,power_law_1.2,0.12747520208358765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,8,power_law_1.2,0.158188796043396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,8,power_law_1.2,0.19260159730911255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,8,power_law_1.2,0.20775680541992186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,8,power_law_1.2,0.2196415901184082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,8,power_law_1.2,0.22209279537200927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,8,power_law_1.2,0.23192958831787108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,4,power_law_1.01,0.08389760255813598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,8,power_law_1.2,0.22980480194091796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,4,power_law_1.01,0.11155200004577637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,8,power_law_1.2,0.24871680736541749
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,4,power_law_1.01,0.07960320115089417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,8,power_law_1.2,0.25180160999298096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,8,power_law_1.2,0.25854079723358153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,4,power_law_1.01,0.10030080080032348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,8,power_law_1.2,0.2722752094268799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,4,power_law_1.01,0.13982080221176146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,4,power_law_1.01,0.15457279682159425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,8,power_law_1.2,0.2700160026550293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,4,power_law_1.01,0.21251840591430665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,8,power_law_1.2,0.30278398990631106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,4,power_law_1.01,0.21518080234527587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,8,power_law_1.2,0.3337088108062744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,4,power_law_1.01,0.21680641174316406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,8,power_law_1.2,0.40188798904418943
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,4,power_law_1.01,0.22009599208831787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,8,power_law_1.2,0.43223037719726565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,4,power_law_1.01,0.23075199127197266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,8,power_law_1.2,0.47031679153442385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,4,power_law_1.01,0.23668479919433594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,8,power_law_1.2,0.5763967990875244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,4,power_law_1.01,0.2542975902557373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,8,power_law_1.2,0.7969600200653076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,4,power_law_1.01,0.25408639907836916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,8,power_law_1.2,1.0181504249572755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,4,power_law_1.2,0.08486400246620178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,4,power_law_1.01,0.2649280071258545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,4,power_law_1.2,0.1123136043548584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,8,power_law_1.2,1.3050623893737794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,4,power_law_1.01,0.27333118915557864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,4,power_law_1.2,0.07381119728088378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,8,power_law_1.2,1.6868095397949219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,4,power_law_1.01,0.28441600799560546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,4,power_law_1.2,0.10041600465774536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,8,power_law_1.2,2.1078847885131835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,4,power_law_1.01,0.30714240074157717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,4,power_law_1.2,0.12334719896316529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,8,power_law_1.2,3.139462471008301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,4,power_law_1.01,0.3265984058380127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,4,power_law_1.2,0.15244799852371216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,4,power_law_1.01,0.37882239818573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,4,power_law_1.2,0.20079360008239747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,8,power_law_1.2,6.933580780029297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,4,power_law_1.01,0.3992831945419312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,4,power_law_1.2,0.22024960517883302
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,4,power_law_1.01,0.5068223953247071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,4,power_law_1.2,0.22145919799804686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,4,power_law_1.01,0.5932223796844482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,4,power_law_1.2,0.23722879886627196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,4,power_law_1.01,0.7199999809265136
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,4,power_law_1.2,0.22864000797271727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,4,power_law_1.01,0.8973504066467285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,4,power_law_1.2,0.2374272108078003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,16,power_law_1.01,0.26187520027160643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,4,power_law_1.01,1.2571904182434082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,16,power_law_1.01,0.27436161041259766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,4,power_law_1.2,0.2476799964904785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,4,power_law_1.01,1.5445311546325684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,16,power_law_1.01,0.29320321083068845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,4,power_law_1.2,0.25915520191192626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,16,power_law_1.01,0.3138688087463379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,4,power_law_1.2,0.262227201461792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,4,power_law_1.01,1.9637567520141601
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,16,power_law_1.01,0.37574400901794436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,4,power_law_1.2,0.273471999168396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,4,power_law_1.01,3.1923519134521485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,16,power_law_1.01,0.3910912036895752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,4,power_law_1.2,0.29109759330749513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,4,power_law_1.01,5.94158706665039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,16,power_law_1.01,0.4732096195220947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,4,power_law_1.2,0.32052481174468994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,16,power_law_1.01,0.5096831798553467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,4,power_law_1.2,0.34333438873291017
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,16,power_law_1.01,0.7453887939453125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,4,power_law_1.2,0.39022719860076904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,16,power_law_1.01,0.8924351692199707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,4,power_law_1.2,0.4391744136810303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,4,power_law_1.2,0.5391232013702393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,16,power_law_1.01,1.333779239654541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,4,power_law_1.2,0.6058815956115723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,16,power_law_1.01,1.643244743347168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,4,power_law_1.2,0.7723904132843018
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,16,power_law_1.01,1.87957763671875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,4,power_law_1.2,0.9165504455566407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,16,power_law_1.01,2.716396713256836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,4,power_law_1.2,1.2804927825927734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,16,power_law_1.01,6.543692779541016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,4,power_law_1.2,1.6628351211547852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,4,power_law_1.2,2.2376575469970703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,4,power_law_1.2,3.272166442871094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,4,power_law_1.2,7.441004943847656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,2,power_law_1.01,0.06603519916534424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,2,power_law_1.01,0.0893887996673584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,2,power_law_1.01,0.08119680285453797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,2,power_law_1.01,0.10289920568466186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,2,power_law_1.01,0.15041279792785645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,2,power_law_1.01,0.17007999420166015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,2,power_law_1.01,0.22250878810882568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,2,power_law_1.01,0.23519999980926515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,2,power_law_1.01,0.24114561080932617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,2,power_law_1.01,0.2501568078994751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,2,power_law_1.01,0.25630080699920654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,2,power_law_1.01,0.26633601188659667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,2,power_law_1.01,0.26715519428253176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,2,power_law_1.01,0.27409920692443845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,2,power_law_1.2,0.06382079720497132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,2,power_law_1.01,0.2843519926071167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,2,power_law_1.2,0.0871616005897522
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,2,power_law_1.01,0.296230411529541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,2,power_law_1.2,0.07692800164222717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,2,power_law_1.01,0.3201920032501221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,2,power_law_1.01,0.37426559925079345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,2,power_law_1.2,0.10008959770202637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,2,power_law_1.01,0.38962559700012206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,2,power_law_1.2,0.12547199726104735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,2,power_law_1.01,0.445740795135498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,2,power_law_1.2,0.15271040201187133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,2,power_law_1.01,0.5178239822387696
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,2,power_law_1.2,0.21293439865112304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,2,power_law_1.01,0.6409152030944825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,2,power_law_1.2,0.22374401092529297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,2,power_law_1.2,0.23710079193115235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,2,power_law_1.01,0.7383999824523926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,2,power_law_1.2,0.24896640777587892
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,2,power_law_1.01,0.94967679977417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,2,power_law_1.2,0.25470719337463377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,2,power_law_1.01,1.1760576248168946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,2,power_law_1.2,0.2600127935409546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,2,power_law_1.01,1.6206655502319336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,2,power_law_1.2,0.2670016050338745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,2,power_law_1.01,1.9502016067504884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,2,power_law_1.2,0.28049919605255125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,2,power_law_1.01,2.547999954223633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,2,power_law_1.2,0.29033598899841306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,2,power_law_1.01,3.9951168060302735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,2,power_law_1.2,0.3159359931945801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,2,power_law_1.2,0.32309761047363283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,2,power_law_1.01,7.091078186035157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,2,power_law_1.2,0.35765120983123777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,2,power_law_1.2,0.40052480697631837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,2,power_law_1.2,0.45518078804016116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,2,power_law_1.2,0.5317952156066894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,2,power_law_1.2,0.6454720020294189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,2,power_law_1.2,0.7949632167816162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,1,power_law_1.01,0.06505600214004517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,2,power_law_1.2,0.9682175636291503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,1,power_law_1.01,0.06874240040779114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,1,power_law_1.01,0.08305919766426087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,2,power_law_1.2,1.2522944450378417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,1,power_law_1.01,0.11011840105056762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,2,power_law_1.2,1.6833856582641602
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,1,power_law_1.01,0.15434880256652833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,1,power_law_1.2,0.06643840074539184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,2,power_law_1.2,2.096256065368652
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,1,power_law_1.01,0.18957439661026002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,1,power_law_1.2,0.07381119728088378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,2,power_law_1.2,2.5181440353393554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,1,power_law_1.01,0.24137599468231202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,1,power_law_1.2,0.08568959832191467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,2,power_law_1.2,4.027526473999023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,1,power_law_1.01,0.26064000129699705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,1,power_law_1.2,0.11106560230255128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,1,power_law_1.01,0.27026560306549074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,1,power_law_1.2,0.1360703945159912
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,2,power_law_1.2,8.753689575195313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,1,power_law_1.01,0.2751744031906128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,1,power_law_1.2,0.1676095962524414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,1,power_law_1.01,0.28460159301757815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,1,power_law_1.2,0.24030721187591553
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,1,power_law_1.01,0.29726719856262207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,1,power_law_1.2,0.25772800445556643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,1,power_law_1.01,0.30323200225830077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,1,power_law_1.2,0.2636607885360718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,1,power_law_1.01,0.3187903881072998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,1,power_law_1.2,0.26960000991821287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,1,power_law_1.01,0.33584640026092527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,16,power_law_1.01,0.07667199969291687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,1,power_law_1.2,0.28638079166412356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,16,power_law_1.01,0.05539199709892273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,1,power_law_1.01,0.3443903923034668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,1,power_law_1.2,0.29601919651031494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,16,power_law_1.01,0.05086719989776611
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,1,power_law_1.01,0.37512319087982177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,1,power_law_1.2,0.3136320114135742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,16,power_law_1.01,0.05805439949035644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,1,power_law_1.01,0.44208641052246095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,1,power_law_1.2,0.32529919147491454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,16,power_law_1.01,0.06357759833335877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,1,power_law_1.01,0.5084479808807373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,1,power_law_1.2,0.3490560054779053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,16,power_law_1.01,0.07299839854240417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,1,power_law_1.01,0.6202688217163086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,16,power_law_1.01,0.07423999905586243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,1,power_law_1.2,0.3642175912857056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,1,power_law_1.01,0.7171135902404785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,16,power_law_1.01,0.07566720247268677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,1,power_law_1.2,0.3851072072982788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,16,power_law_1.01,0.077920001745224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,1,power_law_1.01,0.9321663856506348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,1,power_law_1.2,0.46251521110534666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,16,power_law_1.01,0.07934719920158387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,1,power_law_1.01,1.0542271614074707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,1,power_law_1.2,0.5300992012023926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,16,power_law_1.01,0.08610560297966004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,1,power_law_1.01,1.390726375579834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,1,power_law_1.2,0.6478528022766114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,16,power_law_1.01,0.08897280097007751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,16,power_law_1.01,0.09122560024261475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,1,power_law_1.01,1.7628288269042969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,1,power_law_1.2,0.7371583938598633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,16,power_law_1.01,0.09041280150413514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,1,power_law_1.2,0.9481023788452149
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,1,power_law_1.01,2.410009574890137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,16,power_law_1.01,0.09962239861488342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,1,power_law_1.2,1.0744511604309082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,1,power_law_1.01,3.065158462524414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,16,power_law_1.01,0.1004480004310608
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,16,power_law_1.2,0.07715839743614197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,1,power_law_1.2,1.3890111923217774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,16,power_law_1.01,0.1004480004310608
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,1,power_law_1.01,3.670969772338867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,16,power_law_1.2,0.04990079998970032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,16,power_law_1.01,0.11539839506149292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,1,power_law_1.2,1.778758430480957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,16,power_law_1.2,0.05175039768218994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,1,power_law_1.01,5.603039932250977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,16,power_law_1.01,0.12092800140380859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,16,power_law_1.2,0.055219197273254396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,1,power_law_1.2,2.4091392517089845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,16,power_law_1.01,0.15244799852371216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,16,power_law_1.2,0.06117759943008423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,1,power_law_1.01,10.824832153320312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,1,power_law_1.2,3.043814468383789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,16,power_law_1.01,0.16885119676589966
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,16,power_law_1.2,0.0720192015171051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,16,power_law_1.01,0.21063039302825928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,16,power_law_1.2,0.07406719923019409
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,1,power_law_1.2,3.699987030029297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,16,power_law_1.01,0.25179519653320315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,16,power_law_1.2,0.07651200294494628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,1,power_law_1.2,5.606681442260742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,16,power_law_1.01,0.3508991956710815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,16,power_law_1.2,0.07734400033950806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,16,power_law_1.01,0.39514880180358886
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,16,power_law_1.2,0.08021119832992554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,1,power_law_1.2,10.780121612548829
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,16,power_law_1.2,0.08307200074195861
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,16,power_law_1.01,0.6847296237945557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,16,power_law_1.2,0.08922880291938781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,16,power_law_1.01,0.8096511840820313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,16,power_law_1.2,0.09352959990501404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,16,power_law_1.01,0.9820927619934082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,16,power_law_1.2,0.09292160272598267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,16,power_law_1.01,2.1336896896362303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,16,power_law_1.2,0.09908480048179627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,16,power_law_1.2,0.11011199951171875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,16,power_law_1.01,4.077433776855469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,16,power_law_1.2,0.10887680053710938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,16,power_law_1.2,0.13018239736557008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,16,power_law_1.2,0.12813440561294556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,16,power_law_1.2,0.1588544011116028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,16,power_law_1.2,0.1817919969558716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,16,power_law_1.2,0.23751039505004884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,16,power_law_1.2,0.3028287887573242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,16,power_law_1.2,0.3990976095199585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,16,power_law_1.2,0.6034751892089844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,16,power_law_1.2,0.8330623626708984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,16,power_law_1.2,1.1764991760253907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,16,power_law_1.2,1.4288127899169922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,8,power_law_1.01,0.05850239992141724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,8,power_law_1.01,0.04661760032176972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,16,power_law_1.2,3.3135936737060545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,8,power_law_1.01,0.04211840033531189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,8,power_law_1.01,0.05502079725265503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,16,power_law_1.2,5.901440048217774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,8,power_law_1.01,0.056454402208328244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,8,power_law_1.01,0.06997759938240052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,8,power_law_1.01,0.0711296021938324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,8,power_law_1.01,0.07364479899406433
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,8,power_law_1.01,0.07488639950752259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,8,power_law_1.01,0.07857279777526856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,8,power_law_1.01,0.08157439827919007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,8,power_law_1.01,0.08635519742965699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,8,power_law_1.01,0.09168639779090881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,8,power_law_1.01,0.08819839954376221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,4,power_law_1.01,0.041868799924850465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,8,power_law_1.01,0.10273920297622681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,4,power_law_1.01,0.03899520039558411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,8,power_law_1.01,0.10765440464019775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,4,power_law_1.01,0.04248960018157959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,8,power_law_1.01,0.09816319942474365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,4,power_law_1.01,0.05128960013389587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,8,power_law_1.01,0.11378560066223145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,4,power_law_1.01,0.06460800170898437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,8,power_law_1.01,0.11790080070495605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,4,power_law_1.01,0.0742143988609314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,8,power_law_1.01,0.14001280069351196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,4,power_law_1.01,0.07812479734420777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,8,power_law_1.01,0.15394560098648072
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,4,power_law_1.01,0.07994880080223084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,8,power_law_1.01,0.1985856056213379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,4,power_law_1.01,0.08241919875144958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,8,power_law_1.01,0.24813439846038818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,4,power_law_1.01,0.08568959832191467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,8,power_law_1.01,0.3097856044769287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,4,power_law_1.01,0.09123200178146362
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,8,power_law_1.01,0.43553919792175294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,4,power_law_1.01,0.09164800047874451
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,8,power_law_1.01,0.5596415996551514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,4,power_law_1.01,0.09716479778289795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,8,power_law_1.01,0.6409471988677978
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,4,power_law_1.01,0.09225599765777588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,8,power_law_1.01,0.8488127708435058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,4,power_law_1.01,0.10126719474792481
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,4,power_law_1.2,0.04090240001678467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,4,power_law_1.01,0.1082111954689026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,8,power_law_1.01,1.4230655670166015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,4,power_law_1.2,0.03639039993286133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,4,power_law_1.01,0.11027840375900269
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,4,power_law_1.2,0.04007680118083954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,8,power_law_1.01,2.7534656524658203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,4,power_law_1.01,0.11990400552749633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,4,power_law_1.2,0.04519039988517761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,4,power_law_1.01,0.13731199502944946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,4,power_law_1.2,0.05686399936676025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,4,power_law_1.01,0.15859199762344361
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,4,power_law_1.2,0.0695680022239685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,4,power_law_1.01,0.17416319847106934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,4,power_law_1.2,0.07612159848213196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,4,power_law_1.01,0.21738879680633544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,4,power_law_1.2,0.07816320061683654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,4,power_law_1.01,0.2728895902633667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,4,power_law_1.2,0.08124799728393554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,4,power_law_1.01,0.3457920074462891
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,4,power_law_1.2,0.08408960103988647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,4,power_law_1.01,0.4350719928741455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,4,power_law_1.2,0.08471680283546448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,4,power_law_1.01,0.5878592014312745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,4,power_law_1.2,0.08635519742965699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,4,power_law_1.01,0.8133567810058594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,4,power_law_1.2,0.09045119881629944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,4,power_law_1.01,0.9648896217346191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,4,power_law_1.2,0.09249920248985291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,4,power_law_1.2,0.10068479776382447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,4,power_law_1.01,1.5223551750183106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,4,power_law_1.2,0.11747839450836181
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,4,power_law_1.01,2.8726335525512696
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,4,power_law_1.2,0.11235840320587158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,4,power_law_1.2,0.12569600343704224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,4,power_law_1.2,0.1355072021484375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,4,power_law_1.2,0.16581759452819825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,4,power_law_1.2,0.1754431962966919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,4,power_law_1.2,0.2321727991104126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,4,power_law_1.2,0.2798975944519043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,4,power_law_1.2,0.3997056007385254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,4,power_law_1.2,0.42775678634643555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,4,power_law_1.2,0.7318975925445557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,4,power_law_1.2,0.8924480438232422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,4,power_law_1.2,1.298572826385498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,4,power_law_1.2,2.284876823425293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,4,power_law_1.2,3.7610816955566406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,2,power_law_1.01,0.038841599225997926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,2,power_law_1.01,0.038227200508117676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,2,power_law_1.01,0.042054399847984314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,2,power_law_1.01,0.05392640233039856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,2,power_law_1.01,0.05808640122413635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,2,power_law_1.01,0.07406719923019409
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,2,power_law_1.01,0.07898880243301391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,2,power_law_1.01,0.08062080144882203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,2,power_law_1.01,0.08594560027122497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,2,power_law_1.01,0.08840320110321045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,2,power_law_1.01,0.09201920032501221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,2,power_law_1.01,0.09905279874801635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,2,power_law_1.01,0.10398080348968505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,2,power_law_1.01,0.1023360013961792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,2,power_law_1.01,0.11133439540863037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,2,power_law_1.01,0.11400959491729737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,2,power_law_1.01,0.14410239458084106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,2,power_law_1.2,0.03982079923152924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,2,power_law_1.01,0.16417920589447021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,2,power_law_1.2,0.03941119909286499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,2,power_law_1.01,0.17093759775161743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,2,power_law_1.2,0.045561599731445315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,2,power_law_1.01,0.1965376019477844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,2,power_law_1.01,0.23256959915161132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,2,power_law_1.01,0.2972415924072266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,2,power_law_1.01,0.36796159744262696
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,2,power_law_1.01,0.4916543960571289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,2,power_law_1.01,0.5821887969970703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,2,power_law_1.01,0.8351039886474609
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,2,power_law_1.01,1.0521984100341797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,2,power_law_1.01,1.2993856430053712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,2,power_law_1.01,2.141926383972168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,2,power_law_1.01,4.201606369018554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,1,power_law_1.01,0.037190398573875426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,1,power_law_1.01,0.04007680118083954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,1,power_law_1.01,0.04990079998970032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,1,power_law_1.01,0.05973119735717773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,1,power_law_1.01,0.07200639843940734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,1,power_law_1.01,0.096806401014328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,1,power_law_1.01,0.10069760084152221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,1,power_law_1.01,0.10316159725189208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,1,power_law_1.01,0.10601600408554077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,1,power_law_1.01,0.10724480152130127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,1,power_law_1.01,0.11011199951171875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,1,power_law_1.01,0.11666560173034668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,1,power_law_1.01,0.11871360540390015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,1,power_law_1.01,0.1326143980026245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,1,power_law_1.01,0.15210239887237548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,1,power_law_1.01,0.15823999643325806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,1,power_law_1.01,0.165830397605896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,1,power_law_1.01,0.1979840040206909
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,1,power_law_1.01,0.22829439640045165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,1,power_law_1.01,0.2923968076705933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,1,power_law_1.01,0.3401087999343872
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,1,power_law_1.01,0.4444863796234131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,1,power_law_1.01,0.5506368160247803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,1,power_law_1.01,0.7368127822875976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,1,power_law_1.01,0.9182592391967773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,1,power_law_1.01,1.3022527694702148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,1,power_law_1.01,1.6383295059204102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,1,power_law_1.01,2.0206911087036135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,1,power_law_1.01,3.1392448425292967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,1,power_law_1.01,6.089651107788086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,1,power_law_1.2,0.03678719997406006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,1,power_law_1.2,0.04129279851913452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,1,power_law_1.2,0.04785920083522797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,8,power_law_1.2,0.05864319801330566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,1,power_law_1.2,0.05624960064888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,8,power_law_1.2,0.04023039937019348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,1,power_law_1.2,0.06403840184211732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,8,power_law_1.2,0.04185599982738495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,1,power_law_1.2,0.09658880233764648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,8,power_law_1.2,0.05046399831771851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,1,power_law_1.2,0.10069119930267334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,8,power_law_1.2,0.05496960282325745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,1,power_law_1.2,0.10560640096664428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,8,power_law_1.2,0.0729856014251709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,1,power_law_1.2,0.10662399530410767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,1,power_law_1.2,0.10828160047531128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,8,power_law_1.2,0.0738048017024994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,1,power_law_1.2,0.11461759805679321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,8,power_law_1.2,0.07463039755821228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,1,power_law_1.2,0.11708159446716308
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,8,power_law_1.2,0.07831040024757385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,1,power_law_1.2,0.1215872049331665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,8,power_law_1.2,0.08057600259780884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,1,power_law_1.2,0.13264000415802002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,8,power_law_1.2,0.08466560244560242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,1,power_law_1.2,0.14410879611968994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,8,power_law_1.2,0.08896639943122864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,1,power_law_1.2,0.15189119577407836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,8,power_law_1.2,0.09305599927902222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,1,power_law_1.2,0.17093759775161743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,8,power_law_1.2,0.08712319731712341
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,1,power_law_1.2,0.1994047999382019
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,8,power_law_1.2,0.09756159782409668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,1,power_law_1.2,0.22970879077911377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,8,power_law_1.2,0.09941759705543518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,1,power_law_1.2,0.29443199634552003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,8,power_law_1.2,0.10535039901733398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,1,power_law_1.2,0.3392895936965942
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,8,power_law_1.2,0.11844480037689209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,1,power_law_1.2,0.4400320053100586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,8,power_law_1.2,0.12501120567321777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,1,power_law_1.2,0.5567808151245117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,8,power_law_1.2,0.15449600219726561
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,8,power_law_1.2,0.1786687970161438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,1,power_law_1.2,0.7310719966888428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,8,power_law_1.2,0.22004480361938478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,1,power_law_1.2,0.9239744186401367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,8,power_law_1.2,0.24973440170288086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,1,power_law_1.2,1.309216022491455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,8,power_law_1.2,0.39575040340423584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,1,power_law_1.2,1.6403648376464843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,8,power_law_1.2,0.4170559883117676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,1,power_law_1.2,2.0260032653808593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,8,power_law_1.2,0.7383872032165527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,1,power_law_1.2,3.1175935745239256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,8,power_law_1.2,0.8776512145996094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,1,power_law_1.2,6.076537704467773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,8,power_law_1.2,1.0451775550842286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,8,power_law_1.2,2.0947776794433595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,8,power_law_1.2,3.498681640625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,16,power_law_1.01,0.19141759872436523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,16,power_law_1.01,0.17709439992904663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,16,power_law_1.01,0.09660800099372864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,16,power_law_1.01,0.11707520484924316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,16,power_law_1.01,0.13553279638290405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,16,power_law_1.01,0.18078080415725709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,16,power_law_1.01,0.17564159631729126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,16,power_law_1.01,0.18467199802398682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,16,power_law_1.01,0.18732800483703613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,16,power_law_1.01,0.18814719915390016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,16,power_law_1.01,0.19203200340270996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,16,power_law_1.01,0.19326720237731934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,16,power_law_1.01,0.19736319780349731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,16,power_law_1.01,0.20391039848327636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,16,power_law_1.01,0.21415679454803466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,16,power_law_1.01,0.22050559520721436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,16,power_law_1.01,0.21989119052886963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,16,power_law_1.01,0.24854400157928466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,16,power_law_1.01,0.2792831897735596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,16,power_law_1.01,0.35559680461883547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,16,power_law_1.01,0.3648895978927612
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,16,power_law_1.01,0.4666816234588623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,16,power_law_1.01,0.5636799812316895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,16,power_law_1.01,0.7241087913513183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,16,power_law_1.01,0.9862591743469238
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,16,power_law_1.01,1.3735296249389648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,16,power_law_1.01,1.8013439178466797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,16,power_law_1.01,2.2128000259399414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,16,power_law_1.01,3.492940902709961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,16,power_law_1.01,7.2737983703613285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,2,power_law_1.2,0.05310080051422119
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,2,power_law_1.2,0.06112639904022217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,2,power_law_1.2,0.077920001745224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,2,power_law_1.2,0.08447359800338745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,2,power_law_1.2,0.09020159840583801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,16,power_law_1.2,0.19243520498275757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,2,power_law_1.2,0.09080320000648498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,2,power_law_1.2,0.09429759979248047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,16,power_law_1.2,0.08144000172615051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,2,power_law_1.2,0.09738879799842834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,16,power_law_1.2,0.09536640048027038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,2,power_law_1.2,0.1020799994468689
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,8,power_law_1.01,0.11681280136108399
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,16,power_law_1.2,0.11297919750213622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,8,power_law_1.01,0.13976320028305053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,16,power_law_1.2,0.13468799591064454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,2,power_law_1.2,0.10699520111083985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,2,power_law_1.2,0.10331519842147827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,16,power_law_1.2,0.16622719764709473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,8,power_law_1.01,0.09510400295257568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,2,power_law_1.2,0.11251200437545776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,16,power_law_1.2,0.1703104019165039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,8,power_law_1.01,0.10166399478912354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,2,power_law_1.2,0.11927679777145386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,16,power_law_1.2,0.187116801738739
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,8,power_law_1.01,0.12049920558929443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,2,power_law_1.2,0.14673279523849486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,16,power_law_1.2,0.17891199588775636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,8,power_law_1.01,0.16677759885787963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,2,power_law_1.2,0.17210880517959595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,16,power_law_1.2,0.19816960096359254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,8,power_law_1.01,0.17560319900512694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,2,power_law_1.2,0.17255680561065673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,16,power_law_1.2,0.1994047999382019
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,8,power_law_1.01,0.18112000226974487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,2,power_law_1.2,0.21103360652923583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,16,power_law_1.2,0.1989824056625366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,8,power_law_1.01,0.1786687970161438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,2,power_law_1.2,0.24094080924987793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,16,power_law_1.2,0.1998080015182495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,8,power_law_1.01,0.18317439556121826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,2,power_law_1.2,0.30933759212493894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,16,power_law_1.2,0.20227839946746826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,8,power_law_1.01,0.19218560457229614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,2,power_law_1.2,0.38428800106048583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,16,power_law_1.2,0.218451189994812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,8,power_law_1.01,0.19156479835510254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,2,power_law_1.2,0.4993919849395752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,16,power_law_1.2,0.22499840259552
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,8,power_law_1.01,0.19464319944381714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,2,power_law_1.2,0.6962111949920654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,16,power_law_1.2,0.2368704080581665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,8,power_law_1.01,0.2007807970046997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,2,power_law_1.2,0.9120448112487793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,16,power_law_1.2,0.27619199752807616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,8,power_law_1.01,0.21020801067352296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,2,power_law_1.2,1.1608832359313965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,16,power_law_1.2,0.29402239322662355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,8,power_law_1.01,0.21553280353546142
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,16,power_law_1.2,0.40010881423950195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,8,power_law_1.01,0.2253567934036255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,2,power_law_1.2,1.477683162689209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,16,power_law_1.2,0.46175360679626465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,8,power_law_1.01,0.2440000057220459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,2,power_law_1.2,2.732703971862793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,16,power_law_1.2,0.5117119789123535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,8,power_law_1.01,0.26857600212097166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,2,power_law_1.2,4.500761413574219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,16,power_law_1.2,0.6577343940734863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,8,power_law_1.01,0.30925440788269043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,8,power_law_1.01,0.3322688102722168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,16,power_law_1.2,0.9387007713317871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,8,power_law_1.01,0.41971840858459475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,16,power_law_1.2,1.1384127616882325
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,8,power_law_1.01,0.5100287914276123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,16,power_law_1.2,1.836992073059082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,8,power_law_1.01,0.6478591918945312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,16,power_law_1.2,2.7628864288330077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,8,power_law_1.01,0.8202943801879883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,16,power_law_1.2,2.9799423217773438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,8,power_law_1.01,1.1145983695983888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,16,power_law_1.2,4.529478454589844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,8,power_law_1.01,1.5870783805847168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,8,power_law_1.01,1.6681791305541993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,16,power_law_1.2,10.896851348876954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,8,power_law_1.01,2.9245567321777344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,8,power_law_1.01,6.120320129394531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,8,power_law_1.2,0.11380480527877808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,8,power_law_1.2,0.07837439775466919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,8,power_law_1.2,0.07652480006217957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,8,power_law_1.2,0.10274560451507568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,8,power_law_1.2,0.11052800416946411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,8,power_law_1.2,0.1615231990814209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,8,power_law_1.2,0.17238399982452393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,8,power_law_1.2,0.1746240019798279
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,8,power_law_1.2,0.17459839582443237
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,8,power_law_1.2,0.1891711950302124
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,8,power_law_1.2,0.1881600022315979
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,8,power_law_1.2,0.1858944058418274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,8,power_law_1.2,0.19893120527267455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,8,power_law_1.2,0.20432639122009277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,8,power_law_1.2,0.20945279598236083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,8,power_law_1.2,0.21702399253845214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,8,power_law_1.2,0.2256319999694824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,8,power_law_1.2,0.2518336057662964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,8,power_law_1.2,0.28337280750274657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,8,power_law_1.2,0.3214783906936646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,8,power_law_1.2,0.3714495897293091
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,8,power_law_1.2,0.4957568168640137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,8,power_law_1.2,0.5457215785980225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,8,power_law_1.2,0.7933311939239502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,8,power_law_1.2,0.9125247955322265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,8,power_law_1.2,1.5583935737609864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,8,power_law_1.2,1.9309951782226562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,8,power_law_1.2,2.7407743453979494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,8,power_law_1.2,3.8049217224121095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,8,power_law_1.2,8.605843353271485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,4,power_law_1.01,0.08938239812850952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,4,power_law_1.01,0.10289920568466186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,4,power_law_1.01,0.07832959890365601
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,4,power_law_1.01,0.10024319887161255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,4,power_law_1.01,0.11763839721679688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,4,power_law_1.01,0.1672063946723938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,4,power_law_1.01,0.17212159633636476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,4,power_law_1.01,0.18439680337905884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,4,power_law_1.01,0.18236160278320312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,4,power_law_1.01,0.187283194065094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,4,power_law_1.01,0.19465600252151488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,4,power_law_1.01,0.19956480264663695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,4,power_law_1.2,0.08942080140113831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,4,power_law_1.2,0.06546559929847717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,4,power_law_1.01,0.19895039796829223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,4,power_law_1.2,0.07079039812088013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,4,power_law_1.01,0.20592000484466552
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,4,power_law_1.01,0.21144320964813232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,4,power_law_1.2,0.0906495988368988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,4,power_law_1.01,0.2204416036605835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,4,power_law_1.2,0.11318399906158447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,4,power_law_1.01,0.2284480094909668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,4,power_law_1.2,0.16581120491027831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,4,power_law_1.01,0.24994559288024903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,4,power_law_1.2,0.1764672040939331
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,4,power_law_1.01,0.27491838932037355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,4,power_law_1.2,0.17278079986572265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,2,power_law_1.01,0.06479359865188598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,4,power_law_1.01,0.3175168037414551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,4,power_law_1.2,0.18875520229339598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,2,power_law_1.01,0.07443199753761291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,4,power_law_1.01,0.3447551965713501
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,4,power_law_1.2,0.18630399703979492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,2,power_law_1.01,0.07544320225715637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,4,power_law_1.01,0.41828479766845705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,4,power_law_1.2,0.19039360284805298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,2,power_law_1.01,0.0961408019065857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,4,power_law_1.01,0.5087999820709228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,4,power_law_1.2,0.1998080015182495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,2,power_law_1.01,0.11723519563674926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,4,power_law_1.2,0.20247039794921876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,4,power_law_1.01,0.6226880073547363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,2,power_law_1.01,0.16575360298156738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,4,power_law_1.2,0.2153536081314087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,4,power_law_1.01,0.8633279800415039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,2,power_law_1.01,0.1790719985961914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,4,power_law_1.2,0.22251520156860352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,2,power_law_1.01,0.19219199419021607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,4,power_law_1.01,1.1559679985046387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,4,power_law_1.2,0.22910079956054688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,2,power_law_1.01,0.19587199687957763
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,4,power_law_1.01,1.4883456230163574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,4,power_law_1.2,0.24343039989471435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,2,power_law_1.01,0.20057599544525145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,4,power_law_1.01,1.91210880279541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,4,power_law_1.2,0.2686271905899048
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,2,power_law_1.01,0.2056960105895996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,4,power_law_1.01,3.0274303436279295
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,4,power_law_1.2,0.28009600639343263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,2,power_law_1.01,0.21266560554504393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,4,power_law_1.2,0.3185983896255493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,2,power_law_1.01,0.20753920078277588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,4,power_law_1.01,6.188320159912109
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,4,power_law_1.2,0.3529855966567993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,2,power_law_1.01,0.21388800144195558
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,4,power_law_1.2,0.4584767818450928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,2,power_law_1.01,0.23417599201202394
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,2,power_law_1.01,0.23539199829101562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,4,power_law_1.2,0.5358911991119385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,2,power_law_1.01,0.2566911935806274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,4,power_law_1.2,0.7564608097076416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,2,power_law_1.01,0.282092809677124
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,4,power_law_1.2,0.910041618347168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,2,power_law_1.01,0.3111680030822754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,4,power_law_1.2,1.258022403717041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,2,power_law_1.01,0.3625727891921997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,4,power_law_1.2,1.75097599029541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,2,power_law_1.01,0.4154240131378174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,4,power_law_1.2,2.1077247619628907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,2,power_law_1.01,0.5116672039031982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,4,power_law_1.2,3.32608642578125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,2,power_law_1.01,0.668345594406128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,2,power_law_1.01,0.8723263740539551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,4,power_law_1.2,9.113926696777344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,2,power_law_1.01,1.0050368309020996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,2,power_law_1.01,1.407046413421631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,2,power_law_1.01,1.8184896469116212
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,2,power_law_1.2,0.06341760158538819
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,2,power_law_1.01,2.1689023971557617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,2,power_law_1.2,0.06709120273590088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,2,power_law_1.01,3.48803825378418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,2,power_law_1.2,0.07571200132369996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,2,power_law_1.2,0.09290239810943604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,2,power_law_1.01,7.091481781005859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,2,power_law_1.2,0.11380480527877808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,2,power_law_1.2,0.16828160285949706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,2,power_law_1.2,0.18261760473251343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,2,power_law_1.2,0.18672000169754027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,2,power_law_1.2,0.1965376019477844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,2,power_law_1.2,0.19911680221557618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,2,power_law_1.2,0.20597119331359864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,2,power_law_1.2,0.20719358921051026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,2,power_law_1.2,0.21496961116790772
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,2,power_law_1.2,0.22726399898529054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,2,power_law_1.2,0.2350464105606079
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,2,power_law_1.2,0.2356544017791748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,2,power_law_1.2,0.2684288024902344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,2,power_law_1.2,0.29361920356750487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,2,power_law_1.2,0.31963520050048827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,2,power_law_1.2,0.38085761070251467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,2,power_law_1.2,0.4388160228729248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,2,power_law_1.2,0.5342207908630371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,2,power_law_1.2,0.6884736061096192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,2,power_law_1.2,0.9112895965576172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,2,power_law_1.2,1.0867839813232423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,2,power_law_1.2,1.4681344032287598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,2,power_law_1.2,2.0702592849731447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,2,power_law_1.2,2.5227840423583983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,2,power_law_1.2,3.81343994140625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,2,power_law_1.2,8.610733032226562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,1,power_law_1.01,0.0603007972240448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,1,power_law_1.01,0.07013760209083557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,1,power_law_1.01,0.08488320112228394
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,1,power_law_1.01,0.10986239910125732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,1,power_law_1.01,0.13690240383148194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,1,power_law_1.01,0.19211519956588746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,1,power_law_1.01,0.20648961067199706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,1,power_law_1.01,0.21758720874786378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,1,power_law_1.01,0.21473920345306396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,1,power_law_1.01,0.22578558921813965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,1,power_law_1.01,0.2294719934463501
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,16,power_law_1.01,0.16472959518432617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,1,power_law_1.01,0.23827838897705078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,16,power_law_1.01,0.2716480016708374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,1,power_law_1.01,0.24728960990905763
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,1,power_law_1.01,0.25978240966796873
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,16,power_law_1.01,0.3890048027038574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,1,power_law_1.2,0.05726720094680786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,1,power_law_1.01,0.27924480438232424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,16,power_law_1.01,0.12336000204086303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,1,power_law_1.2,0.0664896011352539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,1,power_law_1.01,0.2921344041824341
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,1,power_law_1.2,0.08307200074195861
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,16,power_law_1.01,0.16432000398635865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,1,power_law_1.01,0.32366719245910647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,1,power_law_1.2,0.10540159940719604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,1,power_law_1.01,0.3873728036880493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,16,power_law_1.01,0.20078721046447753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,1,power_law_1.2,0.12279679775238037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,1,power_law_1.01,0.43427200317382814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,16,power_law_1.01,0.23763198852539064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,1,power_law_1.2,0.19100799560546874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,1,power_law_1.01,0.5518144130706787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,16,power_law_1.01,0.2751231908798218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,1,power_law_1.2,0.2028736114501953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,1,power_law_1.01,0.5956352233886719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,16,power_law_1.01,0.2906816005706787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,1,power_law_1.2,0.21374719142913817
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,1,power_law_1.01,0.7670527935028076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,1,power_law_1.2,0.2213184118270874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,1,power_law_1.01,0.9653056144714356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,16,power_law_1.01,0.27983999252319336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,1,power_law_1.2,0.22581760883331298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,1,power_law_1.01,1.2651328086853026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,16,power_law_1.01,0.29827840328216554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,1,power_law_1.2,0.24097919464111328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,1,power_law_1.01,1.555942440032959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,16,power_law_1.01,0.2947776079177856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,1,power_law_1.2,0.24732160568237305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,1,power_law_1.01,2.156217575073242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,16,power_law_1.01,0.3201855897903442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,1,power_law_1.2,0.2547008037567139
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,1,power_law_1.01,2.7159360885620116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,1,power_law_1.2,0.2676095962524414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,16,power_law_1.01,0.29662721157073973
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,1,power_law_1.01,3.3389312744140627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,1,power_law_1.2,0.28412799835205077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,16,power_law_1.01,0.3267263889312744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,1,power_law_1.2,0.2980992078781128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,1,power_law_1.01,5.171072006225586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,16,power_law_1.01,0.3119679927825928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,1,power_law_1.2,0.32187519073486326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,16,power_law_1.01,0.34393599033355715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,1,power_law_1.2,0.4013376235961914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,1,power_law_1.01,10.386739349365234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,1,power_law_1.2,0.44250240325927737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,16,power_law_1.01,0.35477120876312257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,1,power_law_1.2,0.5608640193939209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,16,power_law_1.01,0.3701567888259888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,16,power_law_1.2,0.15762560367584227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,1,power_law_1.2,0.6047039985656738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,16,power_law_1.01,0.4180736064910889
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,16,power_law_1.2,0.2829567909240723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,1,power_law_1.2,0.768339204788208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,16,power_law_1.2,0.21986560821533202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,16,power_law_1.01,0.4916031837463379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,1,power_law_1.2,0.9846079826354981
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,16,power_law_1.2,0.13222399950027466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,16,power_law_1.01,0.5731071949005127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,1,power_law_1.2,1.2780799865722656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,16,power_law_1.2,0.16316159963607788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,16,power_law_1.01,0.6210368156433106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,1,power_law_1.2,1.5600831985473633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,16,power_law_1.2,0.19203840494155883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,1,power_law_1.2,2.152979278564453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,16,power_law_1.01,0.7977791786193847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,16,power_law_1.2,0.21702399253845214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,1,power_law_1.2,2.755513572692871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,16,power_law_1.01,0.9607935905456543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,16,power_law_1.2,0.2616703987121582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,1,power_law_1.2,3.3987777709960936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,16,power_law_1.01,1.335366439819336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,16,power_law_1.2,0.2768127918243408
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,1,power_law_1.2,5.314271926879883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,16,power_law_1.01,1.5702783584594726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,16,power_law_1.2,0.25886719226837157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,16,power_law_1.2,0.28501760959625244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,16,power_law_1.01,1.922662353515625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,1,power_law_1.2,10.700211334228516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,16,power_law_1.2,0.2854399919509888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,16,power_law_1.01,2.8639936447143555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,16,power_law_1.2,0.2927999973297119
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,16,power_law_1.2,0.31493120193481444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,16,power_law_1.01,6.466828918457031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,16,power_law_1.2,0.3009471893310547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,16,power_law_1.2,0.33743360042572024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,16,power_law_1.2,0.3280256032943726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,16,power_law_1.2,0.37431039810180666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,16,power_law_1.2,0.42408318519592286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,16,power_law_1.2,0.48265600204467773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,16,power_law_1.2,0.5596543788909912
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,16,power_law_1.2,0.69585280418396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,16,power_law_1.2,0.7167551994323731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,16,power_law_1.2,0.8936896324157715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,16,power_law_1.2,1.2416383743286132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,16,power_law_1.2,1.4912704467773437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,16,power_law_1.2,1.9420480728149414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,16,power_law_1.2,2.9052288055419924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,16,power_law_1.2,3.492172622680664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,16,power_law_1.2,10.400640106201172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,8,power_law_1.01,0.11191680431365966
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,8,power_law_1.01,0.16803200244903566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,8,power_law_1.01,0.2655168056488037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,8,power_law_1.01,0.11314560174942016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,8,power_law_1.01,0.1565567970275879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,8,power_law_1.01,0.19137920141220094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,8,power_law_1.01,0.2048896074295044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,8,power_law_1.01,0.2630592107772827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,8,power_law_1.01,0.2683840036392212
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,8,power_law_1.01,0.2952127933502197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,8,power_law_1.01,0.28784000873565674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,8,power_law_1.01,0.306060791015625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,8,power_law_1.01,0.29173119068145753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,8,power_law_1.01,0.29971840381622317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,8,power_law_1.01,0.3283519983291626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,8,power_law_1.2,0.10968960523605346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,8,power_law_1.01,0.32734720706939696
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,8,power_law_1.2,0.16458879709243773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,8,power_law_1.01,0.34620161056518556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,8,power_law_1.2,0.17134720087051392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,8,power_law_1.01,0.36627840995788574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,8,power_law_1.2,0.10150400400161744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,8,power_law_1.01,0.4055808067321777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,8,power_law_1.2,0.13059200048446656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,4,power_law_1.01,0.08486400246620178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,8,power_law_1.01,0.44245758056640627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,8,power_law_1.2,0.1713536024093628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,4,power_law_1.01,0.11312639713287354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,8,power_law_1.01,0.47072639465332033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,8,power_law_1.2,0.20186240673065187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,4,power_law_1.01,0.1716928005218506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,8,power_law_1.01,0.5542463779449462
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,8,power_law_1.2,0.24712319374084474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,4,power_law_1.01,0.09573119878768921
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,8,power_law_1.01,0.5899007797241211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,8,power_law_1.2,0.24978559017181395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,4,power_law_1.01,0.1399616003036499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,8,power_law_1.01,0.7564095973968505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,8,power_law_1.2,0.27764480113983153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,4,power_law_1.01,0.18481279611587526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,8,power_law_1.01,0.9509823799133301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,8,power_law_1.2,0.26986238956451414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,4,power_law_1.01,0.2075455904006958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,8,power_law_1.2,0.28064000606536865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,8,power_law_1.01,1.2620736122131349
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,4,power_law_1.01,0.26898560523986814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,8,power_law_1.2,0.3128511905670166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,8,power_law_1.01,1.5911808013916016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,4,power_law_1.01,0.26243200302124026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,8,power_law_1.2,0.3048831939697266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,8,power_law_1.01,1.923161506652832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,4,power_law_1.01,0.28618879318237306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,8,power_law_1.2,0.32965118885040284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,8,power_law_1.01,2.9766399383544924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,4,power_law_1.01,0.28945279121398926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,8,power_law_1.2,0.3208575963973999
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,4,power_law_1.01,0.30278398990631106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,8,power_law_1.2,0.3474751949310303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,8,power_law_1.01,5.842758560180664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,4,power_law_1.01,0.30462079048156737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,8,power_law_1.2,0.3614016056060791
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,4,power_law_1.01,0.31629440784454343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,8,power_law_1.2,0.4062464237213135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,4,power_law_1.01,0.32591359615325927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,8,power_law_1.2,0.4420928001403809
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,4,power_law_1.2,0.084307199716568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,4,power_law_1.01,0.3453632116317749
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,8,power_law_1.2,0.5309760093688964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,4,power_law_1.2,0.11360000371932984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,4,power_law_1.01,0.34577279090881347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,8,power_law_1.2,0.6425920009613038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,4,power_law_1.2,0.09121919870376587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,4,power_law_1.01,0.39166719913482667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,8,power_law_1.2,0.666758394241333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,4,power_law_1.2,0.09475839734077454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,4,power_law_1.01,0.42831997871398925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,4,power_law_1.2,0.13530880212783813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,8,power_law_1.2,0.7716159820556641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,4,power_law_1.01,0.49201278686523436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,4,power_law_1.2,0.17850879430770875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,8,power_law_1.2,1.0427712440490722
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,4,power_law_1.01,0.5165760040283203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,4,power_law_1.2,0.1903872013092041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,8,power_law_1.2,1.4050368309020995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,4,power_law_1.01,0.6210368156433106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,4,power_law_1.2,0.263923192024231
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,8,power_law_1.2,1.7853567123413085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,4,power_law_1.2,0.25736958980560304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,4,power_law_1.01,0.6716159820556641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,8,power_law_1.2,2.432537651062012
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,4,power_law_1.2,0.27681920528411863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,4,power_law_1.01,0.8686271667480469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,8,power_law_1.2,3.9249088287353517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,4,power_law_1.2,0.289734411239624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,4,power_law_1.01,1.0124095916748046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,4,power_law_1.2,0.28707199096679686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,4,power_law_1.01,1.330470371246338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,8,power_law_1.2,7.0884544372558596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,4,power_law_1.2,0.29852159023284913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,4,power_law_1.01,1.747635269165039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,4,power_law_1.2,0.31902079582214354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,4,power_law_1.01,2.022271919250488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,4,power_law_1.2,0.32413439750671386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,4,power_law_1.01,3.4028350830078127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,4,power_law_1.2,0.33600640296936035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,4,power_law_1.2,0.3544447898864746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,4,power_law_1.01,5.733868789672852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,4,power_law_1.2,0.38925440311431886
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,4,power_law_1.2,0.43834238052368163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,4,power_law_1.2,0.5210752010345459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,4,power_law_1.2,0.5190976142883301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,4,power_law_1.2,0.6288640022277832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,4,power_law_1.2,0.7650752067565918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,4,power_law_1.2,0.9661120414733887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,4,power_law_1.2,1.1294143676757813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,4,power_law_1.2,1.455027198791504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,4,power_law_1.2,1.884294319152832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,4,power_law_1.2,2.1898687362670897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,4,power_law_1.2,3.4388927459716796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,4,power_law_1.2,7.400531005859375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,2,power_law_1.01,0.07088000178337098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,2,power_law_1.01,0.0906175971031189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,2,power_law_1.01,0.12298879623413086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,2,power_law_1.01,0.09306880235671997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,2,power_law_1.01,0.1410048007965088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,2,power_law_1.01,0.18521599769592284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,2,power_law_1.01,0.222707200050354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,2,power_law_1.01,0.27616000175476074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,2,power_law_1.01,0.29418239593505857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,2,power_law_1.01,0.3070847988128662
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,2,power_law_1.01,0.3093247890472412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,2,power_law_1.01,0.32347519397735597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,2,power_law_1.01,0.3310528039932251
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,2,power_law_1.01,0.34907519817352295
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,2,power_law_1.01,0.3548095941543579
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,2,power_law_1.01,0.37405440807342527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,2,power_law_1.01,0.38798720836639405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,2,power_law_1.01,0.4211455821990967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,2,power_law_1.2,0.06504960060119629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,2,power_law_1.01,0.46456317901611327
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,2,power_law_1.2,0.08799999952316284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,2,power_law_1.01,0.540339183807373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,2,power_law_1.2,0.08757759928703308
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,2,power_law_1.01,0.5944191932678222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,2,power_law_1.2,0.10046720504760742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,2,power_law_1.01,0.7445375919342041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,2,power_law_1.2,0.13756799697875977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,2,power_law_1.2,0.1764672040939331
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,2,power_law_1.01,0.8657792091369629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,2,power_law_1.2,0.2075968027114868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,2,power_law_1.01,1.0961855888366698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,2,power_law_1.2,0.2604351997375488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,2,power_law_1.01,1.3460224151611329
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,2,power_law_1.2,0.28991360664367677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,2,power_law_1.01,1.7488704681396485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,2,power_law_1.2,0.27682559490203856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,2,power_law_1.01,2.1877504348754884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,2,power_law_1.2,0.30506880283355714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,2,power_law_1.01,2.6495807647705076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,2,power_law_1.2,0.32782080173492434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,2,power_law_1.01,4.276095962524414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,2,power_law_1.2,0.3331392049789429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,2,power_law_1.2,0.3439807891845703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,2,power_law_1.01,7.7179710388183596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,2,power_law_1.2,0.3595583915710449
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,2,power_law_1.2,0.3668800115585327
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,2,power_law_1.2,0.38877439498901367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,2,power_law_1.2,0.4252863883972168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,1,power_law_1.01,0.06848639845848084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,2,power_law_1.2,0.46421117782592775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,1,power_law_1.01,0.07646719813346863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,2,power_law_1.2,0.5379519939422608
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,1,power_law_1.01,0.10001920461654663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,2,power_law_1.2,0.6360383987426758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,1,power_law_1.01,0.10903680324554443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,2,power_law_1.2,0.7879871845245361
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,1,power_law_1.01,0.16432640552520753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,1,power_law_1.01,0.2118527889251709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,2,power_law_1.2,0.9067839622497559
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,1,power_law_1.01,0.25075840950012207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,2,power_law_1.2,1.131436824798584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,1,power_law_1.01,0.3150592088699341
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,2,power_law_1.2,1.3309120178222655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,8,power_law_1.01,0.047603198885917665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,1,power_law_1.01,0.32652161121368406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,8,power_law_1.01,0.04597119987010956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,2,power_law_1.2,1.8197696685791016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,8,power_law_1.01,0.04433279931545257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,1,power_law_1.01,0.3326848030090332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,8,power_law_1.01,0.04433279931545257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,2,power_law_1.2,2.3207168579101562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,8,power_law_1.01,0.044736000895500186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,1,power_law_1.01,0.3506880044937134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,2,power_law_1.2,2.9209663391113283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,8,power_law_1.01,0.04760960042476654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,1,power_law_1.01,0.368505597114563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,8,power_law_1.01,0.049619200825691226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,2,power_law_1.2,4.118854522705078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,8,power_law_1.01,0.04474239945411682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,1,power_law_1.01,0.3799871921539307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,1,power_law_1.2,0.06895359754562377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,8,power_law_1.01,0.05003520250320435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,1,power_law_1.2,0.07247999906539918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,1,power_law_1.01,0.3920703887939453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,8,power_law_1.01,0.05170559883117676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,2,power_law_1.2,8.94211196899414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,8,power_law_1.01,0.05578240156173706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,1,power_law_1.2,0.09004799723625183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,1,power_law_1.01,0.42032642364501954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,8,power_law_1.01,0.06030719876289368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,1,power_law_1.2,0.11298559904098511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,1,power_law_1.01,0.4328127861022949
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,8,power_law_1.01,0.061939197778701785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,8,power_law_1.01,0.06767359972000123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,1,power_law_1.2,0.14903680086135865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,1,power_law_1.01,0.45963521003723146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,8,power_law_1.01,0.07832959890365601
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,1,power_law_1.2,0.19140479564666749
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,8,power_law_1.01,0.08406400084495544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,1,power_law_1.01,0.535423994064331
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,8,power_law_1.01,0.09020159840583801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,1,power_law_1.2,0.22520959377288818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,1,power_law_1.01,0.5907392024993896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,8,power_law_1.01,0.1133504033088684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,1,power_law_1.2,0.295251202583313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,8,power_law_1.01,0.12482559680938721
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,1,power_law_1.01,0.7252799987792968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,8,power_law_1.01,0.17437440156936646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,1,power_law_1.2,0.29852800369262694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,1,power_law_1.01,0.8305407524108886
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,8,power_law_1.01,0.2122431993484497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,1,power_law_1.2,0.3280191898345947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,8,power_law_1.01,0.3015615940093994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,1,power_law_1.01,1.046412754058838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,8,power_law_1.01,0.3613440036773682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,1,power_law_1.2,0.3335423946380615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,1,power_law_1.01,1.2317376136779785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,8,power_law_1.01,0.43712639808654785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,1,power_law_1.2,0.36078081130981443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,8,power_law_1.01,0.6728447914123535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,1,power_law_1.01,1.587071990966797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,8,power_law_1.2,0.04457600116729736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,8,power_law_1.01,0.9038656234741211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,1,power_law_1.2,0.3661056041717529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,1,power_law_1.01,2.0689599990844725
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,8,power_law_1.2,0.04373759925365448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,8,power_law_1.01,1.3492992401123047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,1,power_law_1.2,0.39171199798583983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,8,power_law_1.2,0.042931199073791504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,8,power_law_1.01,1.8078336715698242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,1,power_law_1.01,2.7431615829467773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,1,power_law_1.2,0.41689600944519045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,8,power_law_1.2,0.04170239865779877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,8,power_law_1.01,2.8476224899291993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,8,power_law_1.2,0.04252800047397613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,1,power_law_1.2,0.42612481117248535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,1,power_law_1.01,3.279539108276367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,8,power_law_1.01,5.464960098266602
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,8,power_law_1.2,0.045177599787712096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,1,power_law_1.2,0.45682559013366697
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,8,power_law_1.2,0.04744960069656372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,1,power_law_1.01,3.9723777770996094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,8,power_law_1.2,0.04254080057144165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,1,power_law_1.2,0.5424384117126465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,8,power_law_1.2,0.04969600141048432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,1,power_law_1.01,6.0361473083496096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,1,power_law_1.2,0.6063360214233399
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,8,power_law_1.2,0.049907198548316954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,1,power_law_1.2,0.7429376125335694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,8,power_law_1.2,0.05072000026702881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,8,power_law_1.2,0.056032001972198486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,1,power_law_1.01,11.537248229980468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,1,power_law_1.2,0.8641983985900878
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,8,power_law_1.2,0.05808640122413635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,1,power_law_1.2,1.0737024307250977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,8,power_law_1.2,0.06709759831428527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,8,power_law_1.2,0.07774720191955567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,1,power_law_1.2,1.2608832359313964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,8,power_law_1.2,0.07978879809379577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,1,power_law_1.2,1.6182655334472655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,8,power_law_1.2,0.09025279879570007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,8,power_law_1.2,0.10559999942779541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,1,power_law_1.2,2.1308799743652345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,8,power_law_1.2,0.14083839654922486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,8,power_law_1.2,0.18240640163421631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,1,power_law_1.2,2.813670349121094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,8,power_law_1.2,0.20144639015197754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,4,power_law_1.01,0.052723199129104614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,8,power_law_1.2,0.292576003074646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,1,power_law_1.2,3.3086719512939453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,4,power_law_1.01,0.044940799474716187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,8,power_law_1.2,0.3433664083480835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,1,power_law_1.2,4.006630325317383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,4,power_law_1.01,0.041465601325035094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,8,power_law_1.2,0.5084415912628174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,4,power_law_1.01,0.04165120124816894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,8,power_law_1.2,0.6720831871032715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,1,power_law_1.2,6.081868743896484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,4,power_law_1.01,0.04206719994544983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,8,power_law_1.2,1.0292287826538087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,4,power_law_1.01,0.04514560103416443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,8,power_law_1.2,1.419801616668701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,4,power_law_1.2,0.05004159808158874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,4,power_law_1.01,0.04597119987010956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,8,power_law_1.2,1.8095359802246094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,1,power_law_1.2,11.54021759033203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,4,power_law_1.2,0.04103679955005646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,4,power_law_1.01,0.05007359981536865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,8,power_law_1.2,2.9418560028076173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,4,power_law_1.2,0.040633600950241086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,4,power_law_1.01,0.05006080269813538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,4,power_law_1.2,0.040633600950241086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,4,power_law_1.01,0.05211520195007324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,8,power_law_1.2,4.982291030883789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,4,power_law_1.01,0.0531391978263855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,4,power_law_1.2,0.040428799390792844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,4,power_law_1.01,0.05475839972496033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,4,power_law_1.2,0.04555520117282867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,4,power_law_1.01,0.057030397653579715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,4,power_law_1.2,0.04739840030670166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,4,power_law_1.01,0.061324799060821535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,4,power_law_1.2,0.043699198961257936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,4,power_law_1.01,0.06972799897193908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,4,power_law_1.2,0.050457602739334105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,4,power_law_1.01,0.07300480008125305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,4,power_law_1.2,0.050457602739334105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,4,power_law_1.01,0.07935360074043274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,4,power_law_1.2,0.051283198595047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,4,power_law_1.01,0.09348480105400085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,4,power_law_1.2,0.054118400812149046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,4,power_law_1.01,0.11457279920578003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,4,power_law_1.2,0.05743359923362732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,4,power_law_1.01,0.14958080053329467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,4,power_law_1.2,0.06172800064086914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,4,power_law_1.01,0.15903359651565552
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,4,power_law_1.2,0.06890239715576171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,4,power_law_1.01,0.23520638942718505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,4,power_law_1.2,0.0711296021938324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,4,power_law_1.01,0.3025791883468628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,4,power_law_1.2,0.08241279721260071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,2,power_law_1.01,0.038022398948669434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,4,power_law_1.01,0.385100793838501
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,4,power_law_1.2,0.10001280307769775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,2,power_law_1.01,0.03761279881000519
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,4,power_law_1.01,0.47849597930908205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,4,power_law_1.2,0.12028800249099732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,2,power_law_1.01,0.039052799344062805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,2,power_law_1.2,0.038841599225997926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,4,power_law_1.01,0.8022848129272461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,4,power_law_1.2,0.14140160083770753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,2,power_law_1.01,0.038848000764846805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,2,power_law_1.2,0.03658879995346069
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,4,power_law_1.01,1.0373760223388673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,4,power_law_1.2,0.15839359760284424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,2,power_law_1.01,0.03925760090351105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,2,power_law_1.2,0.03823359906673431
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,2,power_law_1.01,0.041305598616600034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,4,power_law_1.01,1.3988672256469727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,4,power_law_1.2,0.2278143882751465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,2,power_law_1.2,0.04007039964199066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,2,power_law_1.01,0.04376319944858551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,4,power_law_1.2,0.31055359840393065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,4,power_law_1.01,1.99237117767334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,2,power_law_1.2,0.038848000764846805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,2,power_law_1.01,0.043968001008033754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,4,power_law_1.2,0.3887936115264893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,4,power_law_1.01,4.631033706665039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,2,power_law_1.2,0.04273279905319214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,2,power_law_1.01,0.04539520144462585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,4,power_law_1.2,0.5808767795562744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,2,power_law_1.2,0.04785279929637909
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,2,power_law_1.01,0.04704639911651611
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,4,power_law_1.2,0.879263973236084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,2,power_law_1.2,0.04499199986457825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,2,power_law_1.01,0.0470335990190506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,4,power_law_1.2,1.1940608024597168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,2,power_law_1.2,0.047225600481033324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,2,power_law_1.01,0.05315840244293213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,4,power_law_1.2,1.3251328468322754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,2,power_law_1.2,0.050291198492050174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,2,power_law_1.01,0.053600001335144046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,2,power_law_1.2,0.049702399969100954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,4,power_law_1.2,2.546758460998535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,2,power_law_1.01,0.055852800607681274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,2,power_law_1.2,0.05336959958076477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,2,power_law_1.01,0.06627200245857238
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,4,power_law_1.2,4.914252853393554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,2,power_law_1.2,0.055225598812103274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,2,power_law_1.01,0.0673088014125824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,2,power_law_1.2,0.05399680137634277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,2,power_law_1.01,0.07529600262641907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,2,power_law_1.2,0.06749439835548401
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,2,power_law_1.01,0.09043200016021728
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,2,power_law_1.2,0.06587520241737366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,2,power_law_1.01,0.09434880018234253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,2,power_law_1.2,0.07610880136489868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,2,power_law_1.01,0.12138880491256714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,2,power_law_1.2,0.09004160165786743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,2,power_law_1.01,0.14001920223236083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,2,power_law_1.2,0.10069760084152221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,2,power_law_1.01,0.1764672040939331
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,2,power_law_1.2,0.11172480583190918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,2,power_law_1.01,0.21518080234527587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,2,power_law_1.2,0.14247679710388184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,2,power_law_1.01,0.32700159549713137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,2,power_law_1.2,0.17484159469604493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,2,power_law_1.01,0.403385591506958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,1,power_law_1.01,0.036735999584198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,2,power_law_1.2,0.24364159107208253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,2,power_law_1.01,0.6231167793273926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,1,power_law_1.01,0.036550399661064145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,2,power_law_1.2,0.3353919982910156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,2,power_law_1.01,0.7736703872680664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,1,power_law_1.01,0.03818880021572113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,2,power_law_1.2,0.3853503942489624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,1,power_law_1.01,0.0406464010477066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,2,power_law_1.01,1.0650815963745117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,2,power_law_1.2,0.6116543769836426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,1,power_law_1.01,0.041459199786186215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,2,power_law_1.01,1.4949760437011719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,1,power_law_1.01,0.04310399889945984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,2,power_law_1.2,0.8137984275817871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,2,power_law_1.01,2.865286445617676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,1,power_law_1.01,0.045337599515914914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,2,power_law_1.2,0.9829504013061523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,1,power_law_1.01,0.044736000895500186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,1,power_law_1.2,0.03488639891147614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,2,power_law_1.2,1.4693440437316894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,1,power_law_1.01,0.04658559858798981
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,1,power_law_1.2,0.036524799466133115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,2,power_law_1.2,3.5200191497802735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,1,power_law_1.01,0.0463808000087738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,1,power_law_1.2,0.03653120100498199
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,1,power_law_1.01,0.04883840084075928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,1,power_law_1.2,0.04307200014591217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,1,power_law_1.01,0.05132799744606018
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,1,power_law_1.2,0.041868799924850465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,1,power_law_1.01,0.05416319966316223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,1,power_law_1.2,0.04268159866333008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,1,power_law_1.01,0.056620800495147706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,1,power_law_1.2,0.04677119851112366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,1,power_law_1.01,0.0680895984172821
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,1,power_law_1.2,0.045132800936698914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,1,power_law_1.01,0.07177600264549255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,1,power_law_1.2,0.046777600049972536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,1,power_law_1.01,0.0736191987991333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,1,power_law_1.2,0.048416000604629514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,1,power_law_1.01,0.08693119883537292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,1,power_law_1.2,0.04759039878845215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,1,power_law_1.01,0.09653760194778442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,1,power_law_1.2,0.051692801713943484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,1,power_law_1.01,0.11683199405670167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,1,power_law_1.2,0.05374079942703247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,1,power_law_1.01,0.13772159814834595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,1,power_law_1.2,0.05414400100708008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,1,power_law_1.01,0.1778432011604309
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,1,power_law_1.2,0.06602879762649536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,1,power_law_1.01,0.22311038970947267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,1,power_law_1.2,0.0713536024093628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,1,power_law_1.01,0.3048192024230957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,1,power_law_1.2,0.07339519858360291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,1,power_law_1.01,0.3894079923629761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,1,power_law_1.2,0.08650239706039428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,1,power_law_1.01,0.5591936111450195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,1,power_law_1.2,0.09387519955635071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,1,power_law_1.01,0.7314176082611084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,1,power_law_1.2,0.11457279920578003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,1,power_law_1.01,0.8981311798095704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,8,power_law_1.01,0.05912320017814636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,1,power_law_1.2,0.13646080493927001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,1,power_law_1.01,1.3878208160400392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,8,power_law_1.01,0.05973759889602661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,1,power_law_1.2,0.1758015990257263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,8,power_law_1.01,0.059520000219345094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,1,power_law_1.2,0.21756160259246826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,1,power_law_1.01,2.8062463760375977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,8,power_law_1.2,0.06219519972801209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,8,power_law_1.01,0.06035199761390686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,1,power_law_1.2,0.29989120960235593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,8,power_law_1.2,0.059724801778793336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,8,power_law_1.01,0.06116480231285095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,1,power_law_1.2,0.3871615886688232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,8,power_law_1.2,0.060550397634506224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,8,power_law_1.01,0.05953279733657837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,1,power_law_1.2,0.5546815872192383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,8,power_law_1.2,0.06096000075340271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,8,power_law_1.01,0.06157439947128296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,1,power_law_1.2,0.7142208099365235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,8,power_law_1.2,0.059724801778793336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,8,power_law_1.01,0.06259840130805969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,1,power_law_1.2,0.8833663940429688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,8,power_law_1.2,0.061375999450683595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,8,power_law_1.01,0.06382079720497132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,1,power_law_1.2,1.3828864097595215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,8,power_law_1.2,0.06362879872322083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,8,power_law_1.01,0.06587520241737366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,8,power_law_1.2,0.06259840130805969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,8,power_law_1.01,0.0701632022857666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,1,power_law_1.2,2.834931182861328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,8,power_law_1.01,0.0767359972000122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,8,power_law_1.01,0.07488639950752259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,8,power_law_1.01,0.08881919980049133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,8,power_law_1.01,0.1023360013961792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,8,power_law_1.01,0.1146239995956421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,8,power_law_1.01,0.12076159715652465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,8,power_law_1.01,0.1509951949119568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,8,power_law_1.01,0.16787199974060057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,8,power_law_1.01,0.2297215938568115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,8,power_law_1.01,0.26985599994659426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,8,power_law_1.01,0.3947904109954834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,8,power_law_1.01,0.5317823886871338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,8,power_law_1.01,0.8518272399902344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,8,power_law_1.01,0.9461119651794434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,8,power_law_1.01,1.5899904251098633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,4,power_law_1.01,0.06931840181350708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,4,power_law_1.01,0.04760960042476654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,8,power_law_1.01,2.197644805908203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,4,power_law_1.01,0.05231999754905701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,8,power_law_1.01,2.701247978210449
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,4,power_law_1.01,0.05886719822883606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,8,power_law_1.01,4.3240703582763675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,4,power_law_1.01,0.059487998485565186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,4,power_law_1.01,0.06169599890708923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,8,power_law_1.01,9.038572692871094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,4,power_law_1.01,0.06234880089759827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,4,power_law_1.01,0.06399359703063964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,4,power_law_1.01,0.06378880143165588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,4,power_law_1.01,0.06562560200691223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,4,power_law_1.2,0.07134720087051391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,4,power_law_1.01,0.06542720198631287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,4,power_law_1.2,0.054553598165512085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,4,power_law_1.01,0.07176960110664368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,4,power_law_1.2,0.05023999810218811
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,4,power_law_1.01,0.07341439723968506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,4,power_law_1.2,0.05742080211639404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,4,power_law_1.01,0.07749760150909424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,4,power_law_1.2,0.0586624026298523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,4,power_law_1.01,0.08960000276565552
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,4,power_law_1.2,0.06193280220031738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,4,power_law_1.01,0.0902079999446869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,4,power_law_1.2,0.06213759779930115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,4,power_law_1.01,0.10454399585723877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,4,power_law_1.2,0.06357120275497437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,4,power_law_1.01,0.1430400013923645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,4,power_law_1.2,0.06357120275497437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,4,power_law_1.01,0.1579967975616455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,4,power_law_1.2,0.065830397605896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,4,power_law_1.01,0.17907840013504028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,4,power_law_1.2,0.0662335991859436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,4,power_law_1.01,0.23539841175079346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,4,power_law_1.2,0.06725119948387145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,4,power_law_1.01,0.33882880210876465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,4,power_law_1.2,0.06991360187530518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,4,power_law_1.01,0.43097600936889646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,4,power_law_1.2,0.07789440155029297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,4,power_law_1.01,0.5927680015563965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,4,power_law_1.2,0.08364800214767457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,4,power_law_1.01,0.7428991794586182
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,4,power_law_1.2,0.09880319833755494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,4,power_law_1.01,1.0957695960998535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,4,power_law_1.2,0.10001920461654663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,4,power_law_1.01,1.5862719535827636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,4,power_law_1.2,0.1348479986190796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,4,power_law_1.2,0.1553279995918274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,4,power_law_1.01,1.9243839263916016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,2,power_law_1.01,0.04293760061264038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,4,power_law_1.2,0.18645119667053223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,2,power_law_1.01,0.0455808013677597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,4,power_law_1.01,3.2492481231689454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,4,power_law_1.2,0.26140799522399905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,2,power_law_1.01,0.04764800071716309
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,4,power_law_1.01,7.2258049011230465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,4,power_law_1.2,0.3547967910766602
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,2,power_law_1.01,0.05564799904823303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,2,power_law_1.01,0.05768960118293762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,4,power_law_1.2,0.4246335983276367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,2,power_law_1.01,0.05994240045547485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,4,power_law_1.2,0.6740863800048829
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,2,power_law_1.01,0.0617792010307312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,4,power_law_1.2,0.8903552055358886
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,2,power_law_1.01,0.06403840184211732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,4,power_law_1.2,1.3243391990661622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,2,power_law_1.01,0.06506239771842956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,4,power_law_1.2,1.6546560287475587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,2,power_law_1.01,0.06689919829368592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,4,power_law_1.2,2.519321632385254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,2,power_law_1.01,0.06567040085792542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,2,power_law_1.01,0.0685375988483429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,4,power_law_1.2,3.6414207458496093
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,2,power_law_1.01,0.06955519914627076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,4,power_law_1.2,7.160704040527344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,2,power_law_1.01,0.07530239820480347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,2,power_law_1.01,0.08431360125541687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,2,power_law_1.01,0.08615679740905761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,2,power_law_1.01,0.09210240244865417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,2,power_law_1.01,0.10970879793167114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,2,power_law_1.01,0.1276479959487915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,2,power_law_1.01,0.1619328022003174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,2,power_law_1.01,0.19531519412994386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,2,power_law_1.01,0.26270079612731934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,2,power_law_1.01,0.296889591217041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,2,power_law_1.01,0.4883840084075928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,2,power_law_1.01,0.6161791801452636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,2,power_law_1.01,0.8592703819274903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,2,power_law_1.01,1.1240703582763671
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,2,power_law_1.2,0.044736000895500186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,2,power_law_1.01,1.4439807891845704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,2,power_law_1.2,0.041868799924850465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,2,power_law_1.01,2.305350494384766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,2,power_law_1.2,0.046374401450157164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,2,power_law_1.2,0.05743359923362732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,2,power_law_1.01,5.4408447265625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,2,power_law_1.2,0.059487998485565186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,2,power_law_1.2,0.06289920210838318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,2,power_law_1.2,0.06359040141105651
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,2,power_law_1.2,0.06604160070419311
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,2,power_law_1.2,0.06481279730796814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,2,power_law_1.2,0.06563199758529663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,2,power_law_1.2,0.06787199974060058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,2,power_law_1.2,0.06926079988479614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,2,power_law_1.2,0.07034239768981934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,1,power_law_1.01,0.03776000142097473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,2,power_law_1.2,0.07751039862632751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,2,power_law_1.2,0.08529279828071594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,1,power_law_1.01,0.04104959964752197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,2,power_law_1.2,0.08856959939002991
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,1,power_law_1.01,0.0471807986497879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,2,power_law_1.2,0.10495359897613525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,1,power_law_1.01,0.05742080211639404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,2,power_law_1.2,0.11396479606628418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,1,power_law_1.01,0.05865600109100342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,2,power_law_1.2,0.12952959537506104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,1,power_law_1.01,0.06027519702911377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,2,power_law_1.2,0.15627520084381102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,1,power_law_1.01,0.06417919993400574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,2,power_law_1.2,0.18031359910964967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,1,power_law_1.01,0.06418560147285461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,2,power_law_1.2,0.2655168056488037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,1,power_law_1.01,0.06643840074539184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,2,power_law_1.2,0.34558079242706297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,1,power_law_1.01,0.0662335991859436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,2,power_law_1.2,0.5047232151031494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,1,power_law_1.01,0.06417919993400574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,2,power_law_1.2,0.5788479804992676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,1,power_law_1.01,0.07012479901313781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,2,power_law_1.2,0.8711104393005371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,1,power_law_1.01,0.07217280268669128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,2,power_law_1.2,1.2382975578308106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,1,power_law_1.01,0.07913600206375122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,1,power_law_1.01,0.08568320274353028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,2,power_law_1.2,1.4908224105834962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,1,power_law_1.2,0.03681919872760773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,1,power_law_1.01,0.08773120045661927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,2,power_law_1.2,2.503558349609375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,1,power_law_1.2,0.043558400869369504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,1,power_law_1.01,0.09633280038833618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,2,power_law_1.2,5.4711040496826175
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,1,power_law_1.2,0.044172799587249754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,1,power_law_1.01,0.11804159879684448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,1,power_law_1.2,0.057657599449157715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,1,power_law_1.01,0.1292415976524353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,1,power_law_1.2,0.05852159857749939
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,1,power_law_1.01,0.15368319749832154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,1,power_law_1.2,0.05973759889602661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,1,power_law_1.01,0.18133120536804198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,1,power_law_1.2,0.0634112000465393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,1,power_law_1.01,0.2421504020690918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,1,power_law_1.2,0.06178560256958008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,1,power_law_1.01,0.29500160217285154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,1,power_law_1.2,0.06216959953308106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,1,power_law_1.01,0.4186880111694336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,1,power_law_1.2,0.06362879872322083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,1,power_law_1.01,0.5382847785949707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,1,power_law_1.2,0.06670079827308655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,1,power_law_1.01,0.7686272144317627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,1,power_law_1.2,0.06895359754562377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,1,power_law_1.01,1.0083071708679199
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,1,power_law_1.2,0.07141119837760926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,1,power_law_1.2,0.07530239820480347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,1,power_law_1.01,1.256326389312744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,1,power_law_1.2,0.08451840281486511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,1,power_law_1.01,2.002604866027832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,1,power_law_1.2,0.08739200234413147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,1,power_law_1.01,4.0348350524902346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,1,power_law_1.2,0.09864959716796876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,1,power_law_1.2,0.11667200326919555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,1,power_law_1.2,0.12855679988861085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,1,power_law_1.2,0.15353599786758423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,1,power_law_1.2,0.18116480112075806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,16,power_law_1.01,0.11150720119476318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,1,power_law_1.2,0.2473344087600708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,1,power_law_1.2,0.2989567995071411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,16,power_law_1.01,0.16494079828262329
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,1,power_law_1.2,0.42304000854492185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,16,power_law_1.01,0.0787392020225525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,1,power_law_1.2,0.5448959827423095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,16,power_law_1.01,0.08200960159301758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,1,power_law_1.2,0.7814464092254638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,16,power_law_1.01,0.1016767978668213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,1,power_law_1.2,1.0300800323486328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,1,power_law_1.2,1.2780672073364259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,16,power_law_1.01,0.11990400552749633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,1,power_law_1.2,2.0428096771240236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,16,power_law_1.01,0.1350592017173767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,1,power_law_1.2,4.672447967529297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,16,power_law_1.01,0.13587839603424073
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,16,power_law_1.01,0.1418176054954529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,16,power_law_1.01,0.148364794254303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,16,power_law_1.01,0.15287679433822632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,16,power_law_1.01,0.15799039602279663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,16,power_law_1.2,0.11190400123596192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,16,power_law_1.01,0.160863995552063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,16,power_law_1.2,0.16596479415893556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,16,power_law_1.01,0.16188160181045533
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,16,power_law_1.2,0.07462400197982788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,16,power_law_1.01,0.1745792031288147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,16,power_law_1.2,0.08876799941062927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,8,power_law_1.2,0.0630079984664917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,16,power_law_1.01,0.18685439825057984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,16,power_law_1.2,0.10533759593963624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,8,power_law_1.2,0.0720192015171051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,16,power_law_1.01,0.18257280588150024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,16,power_law_1.2,0.1118783950805664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,8,power_law_1.2,0.06976640224456787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,16,power_law_1.01,0.19832320213317872
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,8,power_law_1.2,0.0761023998260498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,16,power_law_1.2,0.13934719562530518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,8,power_law_1.2,0.07612159848213196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,16,power_law_1.01,0.2210239887237549
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,16,power_law_1.2,0.13975679874420166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,8,power_law_1.2,0.08635519742965699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,16,power_law_1.01,0.2691839933395386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,16,power_law_1.2,0.14424320459365844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,8,power_law_1.2,0.09823359847068787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,8,power_law_1.2,0.11011199951171875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,16,power_law_1.01,0.2972480058670044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,16,power_law_1.2,0.14302719831466676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,8,power_law_1.2,0.11994240283966065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,16,power_law_1.01,0.35890560150146483
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,16,power_law_1.2,0.15367679595947265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,8,power_law_1.2,0.15557760000228882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,8,power_law_1.01,0.11277439594268798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,16,power_law_1.01,0.4274752140045166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,16,power_law_1.2,0.15982719659805297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,8,power_law_1.2,0.17893120050430297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,8,power_law_1.01,0.1133952021598816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,8,power_law_1.2,0.22357120513916015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,16,power_law_1.01,0.5727039813995362
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,16,power_law_1.2,0.15326720476150513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,8,power_law_1.01,0.08144639730453491
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,8,power_law_1.2,0.29155840873718264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,16,power_law_1.2,0.1614527940750122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,16,power_law_1.01,0.7142144203186035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,8,power_law_1.01,0.07813119888305664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,8,power_law_1.2,0.3964224100112915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,16,power_law_1.2,0.1692415952682495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,16,power_law_1.01,0.9345919609069824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,8,power_law_1.2,0.5813504219055176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,8,power_law_1.01,0.09945600032806397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,16,power_law_1.2,0.1778496026992798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,8,power_law_1.2,0.8035648345947266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,8,power_law_1.01,0.1078719973564148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,16,power_law_1.01,1.2837632179260254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,8,power_law_1.2,0.9677887916564941
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,16,power_law_1.2,0.1897279977798462
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,8,power_law_1.01,0.1346943974494934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,16,power_law_1.01,1.5334336280822753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,8,power_law_1.2,1.4497023582458497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,16,power_law_1.2,0.20856959819793702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,8,power_law_1.01,0.14287999868392945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,8,power_law_1.2,2.2246719360351563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,16,power_law_1.01,2.3870208740234373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,16,power_law_1.2,0.22945280075073243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,8,power_law_1.01,0.14205440282821655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,8,power_law_1.2,2.6561792373657225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,8,power_law_1.01,0.1469823956489563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,16,power_law_1.2,0.2747136116027832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,16,power_law_1.01,4.774790573120117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,8,power_law_1.2,4.619180679321289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,8,power_law_1.01,0.1516991972923279
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,16,power_law_1.2,0.31526401042938235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,8,power_law_1.2,9.250527954101562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,8,power_law_1.01,0.15310720205307007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,16,power_law_1.2,0.414188814163208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,8,power_law_1.01,0.1580415964126587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,16,power_law_1.2,0.46129918098449707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,8,power_law_1.01,0.16602879762649536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,16,power_law_1.2,0.6523647785186768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,8,power_law_1.01,0.16929919719696046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,16,power_law_1.2,0.8450752258300781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,8,power_law_1.01,0.17359999418258668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,16,power_law_1.2,1.0896127700805665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,8,power_law_1.01,0.18691840171813964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,16,power_law_1.2,1.3951744079589843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,8,power_law_1.01,0.21744000911712646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,8,power_law_1.01,0.22972800731658935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,16,power_law_1.2,1.9083967208862305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,8,power_law_1.01,0.2678015947341919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,16,power_law_1.2,2.936083221435547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,8,power_law_1.01,0.2964159965515137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,8,power_law_1.01,0.3702143907546997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,16,power_law_1.2,6.305318450927734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,8,power_law_1.01,0.42571520805358887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,8,power_law_1.01,0.5981632232666015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,8,power_law_1.01,0.7507328033447266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,8,power_law_1.2,0.09758080244064331
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,8,power_law_1.2,0.11334400177001953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,8,power_law_1.01,1.0435968399047852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,8,power_law_1.2,0.06706560254096985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,8,power_law_1.01,1.3464703559875488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,8,power_law_1.2,0.07730559706687927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,8,power_law_1.01,1.5289728164672851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,4,power_law_1.01,0.07816320061683654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,8,power_law_1.2,0.0996288001537323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,4,power_law_1.01,0.08922240138053894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,8,power_law_1.01,2.4518016815185546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,8,power_law_1.2,0.10698879957199096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,4,power_law_1.01,0.07159680128097534
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,8,power_law_1.2,0.13608319759368898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,8,power_law_1.01,5.191603088378907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,4,power_law_1.01,0.08431360125541687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,8,power_law_1.2,0.14343680143356324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,4,power_law_1.01,0.10067839622497558
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,8,power_law_1.2,0.1438655972480774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,4,power_law_1.01,0.11542400121688842
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,8,power_law_1.2,0.15185279846191407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,4,power_law_1.01,0.1402176022529602
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,8,power_law_1.2,0.15614080429077148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,4,power_law_1.01,0.14410239458084106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,8,power_law_1.2,0.1622912049293518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,4,power_law_1.01,0.1608896017074585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,8,power_law_1.2,0.16475520133972169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,4,power_law_1.01,0.15783040523529052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,8,power_law_1.2,0.1627071976661682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,4,power_law_1.01,0.1654080033302307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,8,power_law_1.2,0.17745280265808105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,4,power_law_1.2,0.08076800107955932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,4,power_law_1.01,0.17032320499420167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,8,power_law_1.2,0.1819584012031555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,4,power_law_1.2,0.08999040126800537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,4,power_law_1.01,0.17400959730148316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,8,power_law_1.2,0.1923840045928955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,4,power_law_1.2,0.06438400149345398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,4,power_law_1.01,0.17605760097503662
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,4,power_law_1.2,0.0815936028957367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,4,power_law_1.01,0.18424960374832153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,4,power_law_1.2,0.09203839898109437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,4,power_law_1.01,0.18670079708099366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,4,power_law_1.2,0.10882560014724732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,4,power_law_1.01,0.22520320415496825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,4,power_law_1.2,0.14835200309753419
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,4,power_law_1.01,0.24138240814208983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,4,power_law_1.2,0.15124479532241822
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,4,power_law_1.01,0.24487040042877198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,4,power_law_1.2,0.1549183964729309
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,4,power_law_1.01,0.2989376068115234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,4,power_law_1.2,0.15409280061721803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,4,power_law_1.01,0.3261631965637207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,4,power_law_1.2,0.15777280330657958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,4,power_law_1.2,0.1708799958229065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,4,power_law_1.01,0.42346878051757814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,4,power_law_1.2,0.16883200407028198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,4,power_law_1.01,0.48755202293395994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,4,power_law_1.2,0.18153599500656128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,4,power_law_1.01,0.6556992053985595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,4,power_law_1.2,0.18685439825057984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,4,power_law_1.01,0.7998720169067383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,2,power_law_1.01,0.06341760158538819
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,4,power_law_1.2,0.19627519845962524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,4,power_law_1.01,1.118336009979248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,2,power_law_1.01,0.07447680234909057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,4,power_law_1.2,0.20775039196014405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,2,power_law_1.01,0.08227199912071229
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,4,power_law_1.01,1.423078441619873
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,4,power_law_1.2,0.2329472064971924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,2,power_law_1.01,0.09086080193519593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,4,power_law_1.01,1.7571071624755858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,4,power_law_1.2,0.24908800125122071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,2,power_law_1.01,0.11093759536743164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,4,power_law_1.01,2.539027214050293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,4,power_law_1.2,0.306060791015625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,2,power_law_1.01,0.1379520058631897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,2,power_law_1.01,0.17646080255508423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,4,power_law_1.2,0.3547967910766602
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,4,power_law_1.01,5.234124755859375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,2,power_law_1.01,0.18466559648513795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,4,power_law_1.2,0.43753600120544434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,2,power_law_1.01,0.19018239974975587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,4,power_law_1.2,0.5477183818817138
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,2,power_law_1.01,0.19510400295257568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,4,power_law_1.2,0.7023488044738769
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,2,power_law_1.01,0.19120639562606812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,4,power_law_1.2,0.8375167846679688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,2,power_law_1.01,0.20248959064483643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,4,power_law_1.2,1.1715328216552734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,2,power_law_1.01,0.2112895965576172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,4,power_law_1.2,1.5329983711242676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,2,power_law_1.01,0.2431936025619507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,2,power_law_1.01,0.25553278923034667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,4,power_law_1.2,1.8368703842163085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,2,power_law_1.01,0.27314560413360595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,4,power_law_1.2,2.8562175750732424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,2,power_law_1.01,0.25224320888519286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,2,power_law_1.01,0.27968640327453614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,4,power_law_1.2,5.823161697387695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,2,power_law_1.01,0.3089087963104248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,2,power_law_1.01,0.3739007949829102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,2,power_law_1.01,0.43588480949401853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,2,power_law_1.01,0.5420351982116699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,2,power_law_1.01,0.6333824157714844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,2,power_law_1.01,0.8396096229553223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,2,power_law_1.01,1.054246425628662
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,2,power_law_1.01,1.4427455902099608
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,2,power_law_1.01,1.8787776947021484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,2,power_law_1.01,2.265145683288574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,2,power_law_1.01,3.3711360931396483
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,2,power_law_1.2,0.06382079720497132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,2,power_law_1.01,6.900460815429687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,2,power_law_1.2,0.07160959839820862
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,2,power_law_1.2,0.07120640277862549
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,2,power_law_1.2,0.08799359798431397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,2,power_law_1.2,0.10969599485397338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,2,power_law_1.2,0.1264256000518799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,2,power_law_1.2,0.16970880031585694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,2,power_law_1.2,0.17640960216522217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,2,power_law_1.2,0.18260480165481568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,2,power_law_1.2,0.18672640323638917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,2,power_law_1.2,0.2006335973739624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,2,power_law_1.2,0.20391039848327636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,2,power_law_1.2,0.20923519134521484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,2,power_law_1.2,0.2194751977920532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,2,power_law_1.2,0.22787199020385743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,2,power_law_1.2,0.241593599319458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,2,power_law_1.2,0.2583872079849243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,2,power_law_1.2,0.2857599973678589
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,2,power_law_1.2,0.31655681133270264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,2,power_law_1.2,0.3806591987609863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,2,power_law_1.2,0.4482431888580322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,2,power_law_1.2,0.5784832000732422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,2,power_law_1.2,0.656115198135376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,2,power_law_1.2,0.8695103645324707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,2,power_law_1.2,1.1089152336120605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,1,power_law_1.01,0.06643199920654297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,2,power_law_1.2,1.5183103561401368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,1,power_law_1.01,0.07215999960899352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,2,power_law_1.2,1.9703168869018555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,1,power_law_1.01,0.0832319974899292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,2,power_law_1.2,2.412467193603516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,1,power_law_1.01,0.1082111954689026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,1,power_law_1.01,0.13853440284729004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,2,power_law_1.2,3.565702438354492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,1,power_law_1.01,0.17763839960098265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,2,power_law_1.2,7.617247772216797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,1,power_law_1.01,0.23109118938446044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,1,power_law_1.01,0.2425600051879883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,1,power_law_1.01,0.250982403755188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,1,power_law_1.01,0.2585472106933594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,1,power_law_1.01,0.29499518871307373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,1,power_law_1.01,0.31404800415039064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,1,power_law_1.01,0.32408320903778076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,1,power_law_1.2,0.06383360028266907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,1,power_law_1.01,0.3285952091217041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,1,power_law_1.2,0.07120640277862549
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,1,power_law_1.01,0.3580735921859741
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,1,power_law_1.2,0.08021759986877441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,1,power_law_1.01,0.3941184043884277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,16,power_law_1.01,0.08963840007781983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,1,power_law_1.2,0.1023360013961792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,1,power_law_1.01,0.33841919898986816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,16,power_law_1.01,0.04787200093269348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,1,power_law_1.2,0.12524800300598143
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,1,power_law_1.01,0.38920960426330564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,16,power_law_1.01,0.041305598616600034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,1,power_law_1.2,0.17136640548706056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,16,power_law_1.01,0.04395520091056824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,1,power_law_1.01,0.43795199394226075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,1,power_law_1.2,0.23544960021972655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,16,power_law_1.01,0.049907198548316954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,1,power_law_1.01,0.5341760158538819
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,1,power_law_1.2,0.23340160846710206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,16,power_law_1.01,0.05973119735717773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,1,power_law_1.01,0.6284031867980957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,1,power_law_1.2,0.24467840194702148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,16,power_law_1.01,0.0593280017375946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,1,power_law_1.2,0.25552639961242674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,1,power_law_1.01,0.79203200340271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,16,power_law_1.01,0.05994240045547485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,1,power_law_1.2,0.2694463968276978
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,1,power_law_1.01,1.0038016319274903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,16,power_law_1.01,0.06096640229225159
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,16,power_law_1.01,0.06156799793243408
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,1,power_law_1.2,0.2807039976119995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,1,power_law_1.01,1.2837696075439453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,16,power_law_1.01,0.0630079984664917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,1,power_law_1.2,0.2821376085281372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,1,power_law_1.01,1.5735551834106445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,16,power_law_1.01,0.06465920209884643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,1,power_law_1.2,0.35260159969329835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,1,power_law_1.01,2.152934455871582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,16,power_law_1.01,0.06791039705276489
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,1,power_law_1.2,0.37880959510803225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,16,power_law_1.01,0.06833919882774353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,1,power_law_1.01,2.7310848236083984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,1,power_law_1.2,0.3993024110794067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,16,power_law_1.01,0.07386239767074584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,1,power_law_1.2,0.3513727903366089
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,1,power_law_1.01,3.3167999267578123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,16,power_law_1.01,0.0761023998260498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,1,power_law_1.2,0.4042111873626709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,16,power_law_1.01,0.07693439722061157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,1,power_law_1.01,5.048608016967774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,1,power_law_1.2,0.44496002197265627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,16,power_law_1.01,0.08655359745025634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,16,power_law_1.01,0.10151040554046631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,1,power_law_1.2,0.5420479774475098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,1,power_law_1.01,9.761254119873048
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,16,power_law_1.01,0.11767679452896118
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,1,power_law_1.2,0.6479231834411621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,16,power_law_1.01,0.13099520206451415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,1,power_law_1.2,0.7978367805480957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,16,power_law_1.01,0.17155200242996216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,1,power_law_1.2,1.0202560424804688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,16,power_law_1.01,0.20554239749908448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,1,power_law_1.2,1.3010175704956055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,16,power_law_1.01,0.2805056095123291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,1,power_law_1.2,1.5965439796447753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,16,power_law_1.01,0.35790719985961916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,1,power_law_1.2,2.1669248580932616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,16,power_law_1.01,0.4916543960571289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,8,power_law_1.2,0.20938880443573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,16,power_law_1.01,0.682700777053833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,1,power_law_1.2,2.747315216064453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,8,power_law_1.2,0.23745920658111572
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,16,power_law_1.01,0.8101247787475586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,1,power_law_1.2,3.33570556640625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,16,power_law_1.2,0.06602879762649536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,8,power_law_1.2,0.2835200071334839
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,16,power_law_1.01,1.360409641265869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,16,power_law_1.2,0.04103679955005646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,1,power_law_1.2,5.058060836791992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,8,power_law_1.2,0.31159679889678954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,16,power_law_1.2,0.04268800020217896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,16,power_law_1.01,2.636102485656738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,8,power_law_1.2,0.38327679634094236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,16,power_law_1.2,0.045151999592781066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,1,power_law_1.2,9.769094085693359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,8,power_law_1.2,0.45186557769775393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,16,power_law_1.2,0.045952001214027406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,8,power_law_1.2,0.657696008682251
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,16,power_law_1.2,0.05906559824943543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,16,power_law_1.2,0.05803520083427429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,8,power_law_1.2,0.7861760139465332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,16,power_law_1.2,0.06275200247764587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,8,power_law_1.2,1.1125311851501465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,16,power_law_1.2,0.06296319961547851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,8,power_law_1.2,1.443507194519043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,16,power_law_1.2,0.06193280220031738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,8,power_law_1.2,1.6161727905273438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,16,power_law_1.2,0.06559360027313232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,16,power_law_1.2,0.06848000288009644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,8,power_law_1.2,2.784543991088867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,16,power_law_1.2,0.06970880031585694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,8,power_law_1.01,0.06095359921455383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,16,power_law_1.2,0.06889600157737732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,8,power_law_1.2,5.71789436340332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,8,power_law_1.2,0.05625600218772888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,8,power_law_1.01,0.04007039964199066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,16,power_law_1.2,0.07667840123176575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,8,power_law_1.2,0.0355648010969162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,8,power_law_1.01,0.03966720104217529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,16,power_law_1.2,0.07831040024757385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,8,power_law_1.2,0.0398719996213913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,8,power_law_1.01,0.04232319891452789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,16,power_law_1.2,0.08241279721260071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,8,power_law_1.2,0.04294399917125702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,8,power_law_1.01,0.04622719883918762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,16,power_law_1.2,0.09449599981307984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,8,power_law_1.2,0.044582399725914004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,8,power_law_1.01,0.05542399883270264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,16,power_law_1.2,0.1123136043548584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,8,power_law_1.2,0.05952640175819397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,8,power_law_1.01,0.05727360248565674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,16,power_law_1.2,0.12807680368423463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,8,power_law_1.2,0.06218879818916321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,8,power_law_1.01,0.061363202333450315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,16,power_law_1.2,0.15941120386123658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,8,power_law_1.2,0.061587202548980716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,8,power_law_1.01,0.06179839968681335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,16,power_law_1.2,0.18276480436325074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,8,power_law_1.2,0.06219519972801209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,8,power_law_1.01,0.0630016028881073
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,16,power_law_1.2,0.21858561038970947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,8,power_law_1.01,0.06424319744110107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,8,power_law_1.2,0.06566399931907654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,16,power_law_1.2,0.3191551923751831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,8,power_law_1.01,0.06956160068511963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,8,power_law_1.2,0.0685375988483429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,16,power_law_1.2,0.4113152027130127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,8,power_law_1.01,0.0732479989528656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,8,power_law_1.2,0.06751999855041504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,4,power_law_1.01,0.05129600167274475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,16,power_law_1.2,0.6781375885009766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,8,power_law_1.01,0.07181439995765686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,8,power_law_1.2,0.07304959893226623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,4,power_law_1.01,0.03818239867687225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,16,power_law_1.2,0.7998144149780273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,8,power_law_1.01,0.0787775993347168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,4,power_law_1.01,0.041254401206970215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,16,power_law_1.2,1.2153727531433105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,8,power_law_1.01,0.08328319787979126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,4,power_law_1.01,0.04555520117282867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,4,power_law_1.01,0.04863359928131104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,8,power_law_1.01,0.082259202003479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,16,power_law_1.2,1.9633024215698243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,4,power_law_1.01,0.06275839805603027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,8,power_law_1.01,0.09454079866409301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,4,power_law_1.01,0.06542720198631287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,8,power_law_1.01,0.10151040554046631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,16,power_law_1.2,4.306406402587891
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,4,power_law_1.01,0.0676800012588501
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,8,power_law_1.01,0.1232192039489746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,4,power_law_1.01,0.06849920153617858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,8,power_law_1.01,0.1363263964653015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,4,power_law_1.01,0.07300480008125305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,8,power_law_1.01,0.16992000341415406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,4,power_law_1.01,0.07136639952659607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,8,power_law_1.01,0.21374080181121827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,4,power_law_1.01,0.07362560033798218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,8,power_law_1.01,0.30254719257354734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,4,power_law_1.01,0.07300480008125305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,8,power_law_1.01,0.37389440536499025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,4,power_law_1.01,0.0815999984741211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,8,power_law_1.01,0.525651216506958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,4,power_law_1.01,0.09020159840583801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,8,power_law_1.01,0.7130368232727051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,4,power_law_1.01,0.09471359848976135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,8,power_law_1.01,0.8076800346374512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,4,power_law_1.01,0.09306880235671997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,8,power_law_1.01,1.341164779663086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,4,power_law_1.01,0.11146880388259887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,4,power_law_1.01,0.11847039461135864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,4,power_law_1.2,0.0471807986497879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,8,power_law_1.01,2.72293758392334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,4,power_law_1.01,0.14058239459991456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,4,power_law_1.2,0.0414463996887207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,4,power_law_1.01,0.16679680347442627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,4,power_law_1.2,0.03939839899539947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,4,power_law_1.01,0.21594879627227784
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,4,power_law_1.2,0.044121599197387694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,4,power_law_1.01,0.24892799854278563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,4,power_law_1.2,0.04962559938430786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,4,power_law_1.01,0.3326911926269531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,4,power_law_1.2,0.06479359865188598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,4,power_law_1.2,0.06601600050926208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,4,power_law_1.01,0.40704002380371096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,4,power_law_1.2,0.06828799843788147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,4,power_law_1.01,0.5787775993347168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,4,power_law_1.2,0.06848639845848084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,4,power_law_1.01,0.764185619354248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,4,power_law_1.2,0.07074559926986694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,4,power_law_1.01,0.9313088417053222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,4,power_law_1.2,0.07667199969291687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,4,power_law_1.01,1.4385727882385253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,4,power_law_1.2,0.08015360236167908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,4,power_law_1.2,0.08488320112228394
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,4,power_law_1.01,2.881612777709961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,4,power_law_1.2,0.08240640163421631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,4,power_law_1.2,0.08936960101127625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,4,power_law_1.2,0.09756159782409668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,4,power_law_1.2,0.09654399752616882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,4,power_law_1.2,0.10636800527572632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,2,power_law_1.01,0.04170239865779877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,4,power_law_1.2,0.11887359619140625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,2,power_law_1.01,0.040889599919319154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,4,power_law_1.2,0.13954559564590455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,2,power_law_1.01,0.04622080028057098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,2,power_law_1.01,0.048876801133155824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,4,power_law_1.2,0.16945279836654664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,2,power_law_1.01,0.05603839755058289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,4,power_law_1.2,0.20979840755462648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,2,power_law_1.01,0.07386239767074584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,4,power_law_1.2,0.26407680511474607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,2,power_law_1.01,0.07939199805259704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,4,power_law_1.2,0.3459840059280396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,2,power_law_1.01,0.08103039860725403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,4,power_law_1.2,0.4217535972595215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,2,power_law_1.01,0.08082559704780579
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,4,power_law_1.2,0.6279935836791992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,2,power_law_1.01,0.08881279826164246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,4,power_law_1.2,0.803923225402832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,2,power_law_1.01,0.09412479996681214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,4,power_law_1.2,1.1752127647399901
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,2,power_law_1.01,0.0933184027671814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,2,power_law_1.01,0.10151040554046631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,4,power_law_1.2,1.775481605529785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,2,power_law_1.2,0.044947201013565065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,2,power_law_1.01,0.09311360120773315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,2,power_law_1.2,0.040243199467658995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,4,power_law_1.2,4.106111907958985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,2,power_law_1.01,0.09740800261497498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,2,power_law_1.2,0.04597119987010956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,2,power_law_1.01,0.10314240455627441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,2,power_law_1.2,0.05251839756965637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,2,power_law_1.01,0.11336959600448608
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,2,power_law_1.2,0.05722879767417908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,2,power_law_1.01,0.13223040103912354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,2,power_law_1.2,0.0746944010257721
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,2,power_law_1.01,0.1522879958152771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,2,power_law_1.2,0.07791360020637512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,2,power_law_1.01,0.18383359909057617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,2,power_law_1.2,0.08465279936790467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,2,power_law_1.01,0.21946239471435547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,2,power_law_1.2,0.08652160167694092
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,2,power_law_1.01,0.2608383893966675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,2,power_law_1.2,0.09054080247879029
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,2,power_law_1.2,0.09552639722824097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,2,power_law_1.01,0.34891519546508787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,2,power_law_1.2,0.10289920568466186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,2,power_law_1.01,0.45480961799621583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,2,power_law_1.2,0.10740480422973633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,2,power_law_1.01,0.5645503997802734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,2,power_law_1.2,0.10455039739608765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,2,power_law_1.01,0.82608003616333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,2,power_law_1.2,0.11519360542297363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,2,power_law_1.01,1.0227007865905762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,2,power_law_1.2,0.12174079418182374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,2,power_law_1.01,1.2655872344970702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,2,power_law_1.2,0.1164031982421875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,2,power_law_1.01,1.9727615356445312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,2,power_law_1.2,0.13360639810562133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,2,power_law_1.2,0.15367679595947265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,2,power_law_1.01,3.942124938964844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,2,power_law_1.2,0.1856384038925171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,2,power_law_1.2,0.21198720932006837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,2,power_law_1.2,0.281004810333252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,2,power_law_1.2,0.35112318992614744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,2,power_law_1.2,0.48506879806518555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,2,power_law_1.2,0.5989247798919678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,2,power_law_1.2,0.8475071907043457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,2,power_law_1.2,1.0761152267456056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,1,power_law_1.01,0.04103679955005646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,2,power_law_1.2,1.4062527656555175
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,1,power_law_1.01,0.04411520063877106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,1,power_law_1.01,0.05292159914970398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,2,power_law_1.2,2.048019218444824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,1,power_law_1.01,0.0639743983745575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,2,power_law_1.2,4.273235321044922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,1,power_law_1.01,0.0713536024093628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,1,power_law_1.01,0.09789440035820007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,1,power_law_1.01,0.10576000213623046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,1,power_law_1.01,0.10739200115203858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,1,power_law_1.01,0.10862720012664795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,1,power_law_1.01,0.11063679456710815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,1,power_law_1.01,0.12193280458450317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,1,power_law_1.01,0.1336192011833191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,1,power_law_1.01,0.13790719509124755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,1,power_law_1.01,0.14261120557785034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,1,power_law_1.01,0.1549056053161621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,1,power_law_1.01,0.15653760433197023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,1,power_law_1.01,0.16016000509262085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,1,power_law_1.01,0.19540480375289918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,1,power_law_1.01,0.2134783983230591
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,1,power_law_1.2,0.04129279851913452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,1,power_law_1.01,0.26406400203704833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,1,power_law_1.2,0.04355199933052063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,1,power_law_1.01,0.30565121173858645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,1,power_law_1.2,0.05132799744606018
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,1,power_law_1.01,0.4051839828491211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,16,power_law_1.01,0.1248128056526184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,1,power_law_1.2,0.05953279733657837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,1,power_law_1.01,0.5018367767333984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,16,power_law_1.01,0.10310399532318115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,1,power_law_1.2,0.06935679912567139
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,1,power_law_1.01,0.6765247821807862
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,16,power_law_1.01,0.07525759935379028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,1,power_law_1.2,0.09905279874801635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,1,power_law_1.01,0.8423935890197753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,16,power_law_1.01,0.08017280101776122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,1,power_law_1.2,0.10560640096664428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,1,power_law_1.01,1.1862784385681153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,16,power_law_1.01,0.09470720291137695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,1,power_law_1.2,0.10949120521545411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,1,power_law_1.01,1.5149951934814454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,16,power_law_1.01,0.11293439865112305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,1,power_law_1.2,0.11276799440383911
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,16,power_law_1.01,0.11150720119476318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,1,power_law_1.2,0.11706240177154541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,1,power_law_1.01,1.868876838684082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,1,power_law_1.2,0.12689919471740724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,16,power_law_1.01,0.11887359619140625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,1,power_law_1.01,2.891846466064453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,1,power_law_1.2,0.14001280069351196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,16,power_law_1.01,0.11905920505523682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,1,power_law_1.2,0.138374400138855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,16,power_law_1.01,0.12666239738464355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,1,power_law_1.01,5.640262222290039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,16,power_law_1.01,0.12830079793930055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,1,power_law_1.2,0.14103039503097534
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,1,power_law_1.2,0.153056001663208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,16,power_law_1.01,0.12912000417709352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,1,power_law_1.2,0.15679999589920043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,16,power_law_1.01,0.13525760173797607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,1,power_law_1.2,0.15372159481048583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,16,power_law_1.01,0.13895039558410643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,1,power_law_1.2,0.18259840011596679
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,16,power_law_1.01,0.1418176054954529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,1,power_law_1.2,0.21537280082702637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,16,power_law_1.01,0.15779199600219726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,1,power_law_1.2,0.26616320610046384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,16,power_law_1.01,0.16638720035552979
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,1,power_law_1.2,0.3239232063293457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,16,power_law_1.01,0.18933119773864746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,1,power_law_1.2,0.4180607795715332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,16,power_law_1.01,0.19177600145339965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,16,power_law_1.01,0.2442176103591919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,1,power_law_1.2,0.5043456077575683
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,16,power_law_1.01,0.24995200634002684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,1,power_law_1.2,0.6711935997009277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,16,power_law_1.01,0.3335103988647461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,1,power_law_1.2,0.844115161895752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,16,power_law_1.01,0.40047359466552734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,8,power_law_1.2,0.07427200078964233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,1,power_law_1.2,1.1982144355773925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,16,power_law_1.01,0.5280704021453857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,8,power_law_1.2,0.08513280153274536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,1,power_law_1.2,1.5105216026306152
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,8,power_law_1.2,0.08574720025062561
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,16,power_law_1.01,0.6638400077819824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,16,power_law_1.2,0.13463040590286254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,1,power_law_1.2,1.8558336257934571
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,8,power_law_1.2,0.08675839900970458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,16,power_law_1.2,0.07381119728088378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,16,power_law_1.01,0.9677632331848145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,1,power_law_1.2,2.883296012878418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,8,power_law_1.2,0.09823359847068787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,16,power_law_1.2,0.07381759881973267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,16,power_law_1.01,1.28089599609375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,8,power_law_1.2,0.1064255952835083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,16,power_law_1.2,0.08608639836311341
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,1,power_law_1.2,5.638265609741211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,16,power_law_1.01,1.4891776084899901
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,8,power_law_1.2,0.12997759580612184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,16,power_law_1.2,0.09550719857215881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,8,power_law_1.2,0.1551743984222412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,16,power_law_1.01,2.573388862609863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,16,power_law_1.2,0.10817919969558716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,8,power_law_1.2,0.20103681087493896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,16,power_law_1.2,0.1211135983467102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,16,power_law_1.01,4.782976150512695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,8,power_law_1.2,0.25756800174713135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,16,power_law_1.2,0.11928319931030273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,8,power_law_1.2,0.33457279205322266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,16,power_law_1.2,0.12828799486160278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,8,power_law_1.2,0.40911359786987306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,16,power_law_1.2,0.12296960353851319
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,8,power_law_1.2,0.644646406173706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,16,power_law_1.2,0.13215999603271483
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,16,power_law_1.2,0.1297152042388916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,8,power_law_1.2,0.812985610961914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,16,power_law_1.2,0.1368831992149353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,8,power_law_1.2,1.0439935684204102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,16,power_law_1.2,0.14179199934005737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,8,power_law_1.2,1.7558591842651368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,16,power_law_1.2,0.15204479694366455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,16,power_law_1.2,0.16965119838714598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,8,power_law_1.2,3.4708736419677733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,16,power_law_1.2,0.16145919561386107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,16,power_law_1.2,0.18398720026016235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,16,power_law_1.2,0.20980479717254638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,16,power_law_1.2,0.2831167936325073
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,8,power_law_1.01,0.1017024040222168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,16,power_law_1.2,0.2661184072494507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,8,power_law_1.01,0.0937279999256134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,8,power_law_1.01,0.06833919882774353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,16,power_law_1.2,0.3615551948547363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,8,power_law_1.01,0.08636159896850586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,16,power_law_1.2,0.44121599197387695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,8,power_law_1.2,0.10188159942626954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,8,power_law_1.01,0.09085440039634704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,8,power_law_1.2,0.07013760209083557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,16,power_law_1.2,0.6308735847473145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,8,power_law_1.01,0.110099196434021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,8,power_law_1.2,0.0676800012588501
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,16,power_law_1.2,0.8931455612182617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,8,power_law_1.01,0.11708159446716308
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,8,power_law_1.2,0.08058239817619324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,16,power_law_1.2,1.1153984069824219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,8,power_law_1.01,0.12076799869537354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,8,power_law_1.2,0.09326720237731934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,16,power_law_1.2,1.6153343200683594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,8,power_law_1.2,0.11005439758300781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,16,power_law_1.2,1.8873151779174804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,8,power_law_1.2,0.11476479768753052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,8,power_law_1.2,0.11930240392684936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,16,power_law_1.2,3.451142501831055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,8,power_law_1.2,0.12256640195846558
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,16,power_law_1.2,7.7546241760253904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,4,power_law_1.01,0.08512639999389648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,4,power_law_1.01,0.07980800271034241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,4,power_law_1.01,0.06362239718437195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,4,power_law_1.01,0.0830847978591919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,4,power_law_1.01,0.09106559753417968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,4,power_law_1.01,0.11945600509643554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,4,power_law_1.01,0.12527999877929688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,4,power_law_1.01,0.12282240390777588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,4,power_law_1.01,0.12814079523086547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,4,power_law_1.01,0.1303936004638672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,4,power_law_1.01,0.1387712001800537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,4,power_law_1.01,0.14568320512771607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,4,power_law_1.01,0.1469823956489563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,4,power_law_1.01,0.14902399778366088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,4,power_law_1.01,0.16419199705123902
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,4,power_law_1.01,0.16808320283889772
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,4,power_law_1.01,0.17319680452346803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,4,power_law_1.01,0.19162880182266234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,4,power_law_1.01,0.21517438888549806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,4,power_law_1.2,0.0729856014251709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,4,power_law_1.01,0.2600127935409546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,4,power_law_1.2,0.06255360245704651
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,4,power_law_1.01,0.2829632043838501
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,4,power_law_1.2,0.06727039813995361
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,4,power_law_1.01,0.364467191696167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,4,power_law_1.2,0.08200960159301758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,4,power_law_1.01,0.44292478561401366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,4,power_law_1.2,0.08855680227279664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,4,power_law_1.01,0.5821824073791504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,4,power_law_1.2,0.12151039838790893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,4,power_law_1.01,0.7314688205718994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,4,power_law_1.2,0.11846400499343872
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,4,power_law_1.01,1.0317248344421386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,4,power_law_1.2,0.126636803150177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,4,power_law_1.01,1.3759872436523437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,4,power_law_1.2,0.12583680152893068
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,4,power_law_1.01,1.6444799423217773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,4,power_law_1.2,0.13155839443206788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,4,power_law_1.2,0.14261759519577027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,4,power_law_1.01,2.618079948425293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,4,power_law_1.2,0.1467136025428772
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,4,power_law_1.01,4.958963012695312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,4,power_law_1.2,0.15287040472030639
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,4,power_law_1.2,0.1479423999786377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,4,power_law_1.2,0.1590016007423401
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,4,power_law_1.2,0.15983359813690184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,4,power_law_1.2,0.17703039646148683
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,4,power_law_1.2,0.2003711938858032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,4,power_law_1.2,0.220032000541687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,4,power_law_1.2,0.26202239990234377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,4,power_law_1.2,0.30503039360046386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,4,power_law_1.2,0.37200000286102297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,4,power_law_1.2,0.44858880043029786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,4,power_law_1.2,0.5833536148071289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,4,power_law_1.2,0.7621439933776856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,4,power_law_1.2,1.0345279693603515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,4,power_law_1.2,1.3431551933288575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,4,power_law_1.2,1.9166015625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,4,power_law_1.2,2.9365055084228517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,4,power_law_1.2,5.564908981323242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,2,power_law_1.01,0.05973119735717773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,2,power_law_1.01,0.06670719981193543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,2,power_law_1.01,0.06792320013046264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,2,power_law_1.01,0.08104320168495179
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,2,power_law_1.01,0.0976256012916565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,2,power_law_1.01,0.13040000200271606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,2,power_law_1.01,0.1363136053085327
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,2,power_law_1.01,0.14902399778366088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,2,power_law_1.01,0.1486207962036133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,2,power_law_1.01,0.15557760000228882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,2,power_law_1.01,0.16417920589447021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,2,power_law_1.01,0.17278079986572265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,2,power_law_1.01,0.17975679636001587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,2,power_law_1.01,0.18343039751052856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,2,power_law_1.01,0.19531519412994386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,2,power_law_1.01,0.1977728009223938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,2,power_law_1.01,0.20227839946746826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,2,power_law_1.01,0.2346496105194092
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,2,power_law_1.01,0.25736958980560304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,2,power_law_1.01,0.31738240718841554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,2,power_law_1.2,0.06643840074539184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,2,power_law_1.01,0.36754560470581055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,2,power_law_1.2,0.06439679861068726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,2,power_law_1.01,0.4404607772827148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,2,power_law_1.2,0.0670527994632721
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,2,power_law_1.01,0.582585620880127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,2,power_law_1.2,0.08076800107955932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,2,power_law_1.01,0.7474559783935547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,2,power_law_1.2,0.09715200066566468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,2,power_law_1.01,0.9055616378784179
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,2,power_law_1.2,0.12991360425949097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,2,power_law_1.01,1.3013567924499512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,2,power_law_1.2,0.1411967992782593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,2,power_law_1.01,1.5981887817382812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,2,power_law_1.2,0.14610559940338136
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,2,power_law_1.01,2.0309247970581055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,2,power_law_1.2,0.15244799852371216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,2,power_law_1.2,0.15592960119247437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,2,power_law_1.01,3.0713216781616213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,2,power_law_1.2,0.16739840507507325
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,2,power_law_1.2,0.17620480060577393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,2,power_law_1.01,5.960435104370117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,2,power_law_1.2,0.17990399599075318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,2,power_law_1.2,0.18255360126495362
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,2,power_law_1.2,0.19587199687957763
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,2,power_law_1.2,0.1991487979888916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,2,power_law_1.2,0.20992639064788818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,2,power_law_1.2,0.23724160194396973
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,2,power_law_1.2,0.2603840112686157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,2,power_law_1.2,0.31587839126586914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,2,power_law_1.2,0.37075200080871584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,2,power_law_1.2,0.4662015914916992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,2,power_law_1.2,0.5821184158325196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,2,power_law_1.2,0.7781184196472168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,2,power_law_1.2,0.9440064430236816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,2,power_law_1.2,1.3333312034606934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,2,power_law_1.2,1.7057855606079102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,2,power_law_1.2,2.125907135009766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,2,power_law_1.2,3.447897720336914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,2,power_law_1.2,6.411135864257813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,8,power_law_1.01,0.12033920288085938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,8,power_law_1.01,0.11912319660186768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,8,power_law_1.01,0.1269055962562561
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,8,power_law_1.01,0.12977919578552247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,8,power_law_1.01,0.1356735944747925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,8,power_law_1.2,0.12461440563201905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,8,power_law_1.01,0.1379647970199585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,8,power_law_1.2,0.13300479650497438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,8,power_law_1.01,0.14922879934310912
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,8,power_law_1.2,0.130348801612854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,8,power_law_1.01,0.15312639474868775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,8,power_law_1.2,0.14243199825286865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,8,power_law_1.01,0.15598080158233643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,8,power_law_1.2,0.148364794254303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,1,power_law_1.01,0.05952640175819397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,8,power_law_1.2,0.15429760217666627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,8,power_law_1.01,0.17646080255508423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,1,power_law_1.01,0.06670719981193543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,8,power_law_1.2,0.16391680240631104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,8,power_law_1.01,0.20042879581451417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,1,power_law_1.01,0.07898880243301391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,8,power_law_1.2,0.16209280490875244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,8,power_law_1.01,0.24896640777587892
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,1,power_law_1.01,0.09966719746589661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,8,power_law_1.2,0.18214399814605714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,8,power_law_1.01,0.2612607955932617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,1,power_law_1.01,0.11830400228500366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,8,power_law_1.2,0.20817279815673828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,8,power_law_1.01,0.31409919261932373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,1,power_law_1.01,0.17052160501480101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,8,power_law_1.2,0.25281920433044436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,8,power_law_1.01,0.3906816005706787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,1,power_law_1.01,0.1801599979400635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,8,power_law_1.2,0.2692032098770142
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,1,power_law_1.01,0.19039360284805298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,8,power_law_1.01,0.5170368194580078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,8,power_law_1.2,0.33882880210876465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,1,power_law_1.01,0.1891711950302124
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,8,power_law_1.01,0.634611177444458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,8,power_law_1.2,0.408460807800293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,1,power_law_1.01,0.19102079868316652
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,8,power_law_1.01,0.8965375900268555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,8,power_law_1.2,0.5804992198944092
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,1,power_law_1.01,0.20023679733276367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,8,power_law_1.01,1.2162431716918944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,1,power_law_1.01,0.20842878818511962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,8,power_law_1.2,0.6822720050811768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,8,power_law_1.01,1.412012767791748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,1,power_law_1.01,0.20740480422973634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,8,power_law_1.2,1.0398655891418458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,8,power_law_1.01,2.2476032257080076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,1,power_law_1.01,0.2217344045639038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,8,power_law_1.2,1.2981120109558106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,1,power_law_1.01,0.23381760120391845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,8,power_law_1.01,4.979020690917968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,8,power_law_1.2,1.776313591003418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,1,power_law_1.01,0.24568960666656495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,8,power_law_1.2,2.6204992294311524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,1,power_law_1.01,0.2633023977279663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,1,power_law_1.01,0.3177664041519165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,1,power_law_1.2,0.0604095995426178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,8,power_law_1.2,5.553843307495117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,1,power_law_1.01,0.3534080028533936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,1,power_law_1.2,0.06684160232543945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,1,power_law_1.01,0.44250879287719724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,1,power_law_1.2,0.07893120050430298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,1,power_law_1.01,0.5100927829742432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,1,power_law_1.2,0.0955136001110077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,1,power_law_1.2,0.11312639713287354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,1,power_law_1.01,0.6646463871002197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,1,power_law_1.2,0.16987520456314087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,1,power_law_1.01,0.8322367668151855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,1,power_law_1.2,0.17804800271987914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,1,power_law_1.01,1.092953586578369
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,1,power_law_1.2,0.19176959991455078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,1,power_law_1.01,1.3411520004272461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,1,power_law_1.2,0.19585920572280885
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,1,power_law_1.01,1.8587007522583008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,1,power_law_1.2,0.1995519995689392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,1,power_law_1.01,2.378886413574219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,1,power_law_1.2,0.2048703908920288
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,1,power_law_1.01,2.9283647537231445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,1,power_law_1.2,0.21511681079864503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,1,power_law_1.2,0.2134783983230591
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,1,power_law_1.01,4.527840042114258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,1,power_law_1.2,0.2323199987411499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,16,power_law_1.01,0.12914559841156006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,1,power_law_1.2,0.24420480728149413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,1,power_law_1.01,8.96300811767578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,1,power_law_1.2,0.25116159915924074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,16,power_law_1.01,0.16254080533981324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,1,power_law_1.2,0.2669440031051636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,16,power_law_1.01,0.21004800796508788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,16,power_law_1.2,0.11867519617080688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,1,power_law_1.2,0.3214207887649536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,16,power_law_1.01,0.0902400016784668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,16,power_law_1.2,0.1659775972366333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,1,power_law_1.2,0.3572544097900391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,16,power_law_1.01,0.1004863977432251
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,1,power_law_1.2,0.43834238052368163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,16,power_law_1.2,0.11006079912185669
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,16,power_law_1.01,0.12997119426727294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,1,power_law_1.2,0.5202688217163086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,16,power_law_1.2,0.09676160216331482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,1,power_law_1.2,0.6626304149627685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,16,power_law_1.01,0.1449280023574829
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,16,power_law_1.2,0.09800320267677307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,1,power_law_1.2,0.8395520210266113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,16,power_law_1.01,0.1654080033302307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,16,power_law_1.2,0.12295680046081543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,1,power_law_1.2,1.0969856262207032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,16,power_law_1.01,0.1731775999069214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,16,power_law_1.2,0.14611200094223023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,1,power_law_1.2,1.3468416213989258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,16,power_law_1.01,0.17605760097503662
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,16,power_law_1.2,0.1631168007850647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,1,power_law_1.2,1.8758399963378907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,16,power_law_1.01,0.18096640110015869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,16,power_law_1.2,0.17537280321121215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,1,power_law_1.2,2.3886592864990233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,16,power_law_1.01,0.19448319673538209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,16,power_law_1.2,0.17375999689102173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,1,power_law_1.2,2.9389568328857423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,16,power_law_1.2,0.182150399684906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,16,power_law_1.01,0.19242240190505983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,1,power_law_1.2,4.579411315917969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,16,power_law_1.2,0.18072320222854615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,16,power_law_1.01,0.20592639446258545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,8,power_law_1.01,0.09864959716796876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,16,power_law_1.2,0.19587839841842652
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,16,power_law_1.01,0.20629758834838868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,1,power_law_1.2,9.100780487060547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,8,power_law_1.01,0.11360000371932984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,16,power_law_1.2,0.1993664026260376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,16,power_law_1.01,0.19653120040893554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,8,power_law_1.01,0.16787199974060057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,16,power_law_1.2,0.20817921161651612
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,16,power_law_1.01,0.22357120513916015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,8,power_law_1.01,0.0798143982887268
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,16,power_law_1.2,0.20694398880004883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,16,power_law_1.01,0.26410880088806155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,16,power_law_1.2,0.21962239742279052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,8,power_law_1.01,0.09701120257377624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,16,power_law_1.01,0.2506112098693848
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,16,power_law_1.2,0.25689599514007566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,8,power_law_1.01,0.12900480031967163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,16,power_law_1.01,0.29278719425201416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,16,power_law_1.2,0.26654078960418703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,8,power_law_1.01,0.14042240381240845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,16,power_law_1.01,0.35831680297851565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,16,power_law_1.2,0.31856000423431396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,8,power_law_1.01,0.15946240425109864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,16,power_law_1.01,0.41710720062255857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,16,power_law_1.2,0.3654592037200928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,8,power_law_1.01,0.1729920029640198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,16,power_law_1.01,0.5186944007873535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,16,power_law_1.2,0.4752319812774658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,8,power_law_1.01,0.1707327961921692
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,16,power_law_1.01,0.6450431823730469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,8,power_law_1.01,0.17996159791946412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,16,power_law_1.2,0.5456704139709473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,16,power_law_1.01,0.7683328151702881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,8,power_law_1.01,0.19183360338211058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,16,power_law_1.2,0.7179008007049561
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,16,power_law_1.01,1.0760831832885742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,8,power_law_1.01,0.1901952028274536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,16,power_law_1.2,0.8446847915649414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,16,power_law_1.01,1.3395071983337403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,8,power_law_1.01,0.19347200393676758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,16,power_law_1.2,1.1850560188293457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,16,power_law_1.01,1.574028778076172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,8,power_law_1.2,0.10657279491424561
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,8,power_law_1.01,0.20351359844207764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,16,power_law_1.2,1.4725888252258301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,8,power_law_1.2,0.1155776023864746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,16,power_law_1.01,2.38417911529541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,8,power_law_1.01,0.21456639766693114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,16,power_law_1.2,1.8994047164916992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,8,power_law_1.2,0.10698239803314209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,8,power_law_1.01,0.22276480197906495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,16,power_law_1.01,4.831148910522461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,8,power_law_1.2,0.08076800107955932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,16,power_law_1.2,2.6766143798828126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,8,power_law_1.01,0.25571839809417723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,8,power_law_1.2,0.10001280307769775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,8,power_law_1.01,0.2629055976867676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,16,power_law_1.2,6.132588958740234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,8,power_law_1.2,0.11886719465255738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,8,power_law_1.01,0.3058367967605591
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,8,power_law_1.2,0.1340224027633667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,8,power_law_1.01,0.34973440170288084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,8,power_law_1.2,0.16145919561386107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,8,power_law_1.01,0.4400576114654541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,8,power_law_1.2,0.16577279567718506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,8,power_law_1.01,0.5252352237701416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,8,power_law_1.2,0.16391040086746217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,8,power_law_1.01,0.6720895767211914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,8,power_law_1.2,0.1692415952682495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,8,power_law_1.01,0.8109503746032715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,8,power_law_1.2,0.18009599447250366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,8,power_law_1.01,1.0544384002685547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,8,power_law_1.2,0.19381760358810424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,8,power_law_1.01,1.3763839721679687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,8,power_law_1.2,0.1987391948699951
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,8,power_law_1.01,1.6711040496826173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,8,power_law_1.2,0.2029439926147461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,8,power_law_1.2,0.21307520866394042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,8,power_law_1.01,2.5521535873413086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,8,power_law_1.2,0.22615039348602295
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,8,power_law_1.01,5.072012710571289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,8,power_law_1.2,0.250764799118042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,8,power_law_1.2,0.27431039810180663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,8,power_law_1.2,0.329804801940918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,4,power_law_1.01,0.08021119832992554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,8,power_law_1.2,0.36830720901489256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,4,power_law_1.01,0.0902400016784668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,8,power_law_1.2,0.4703104019165039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,4,power_law_1.01,0.12198400497436523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,4,power_law_1.2,0.0815936028957367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,8,power_law_1.2,0.5323264122009277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,4,power_law_1.01,0.07980160117149353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,4,power_law_1.2,0.09305599927902222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,4,power_law_1.2,0.08365439772605895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,4,power_law_1.01,0.10314879417419434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,8,power_law_1.2,0.7113535881042481
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,4,power_law_1.2,0.08158720135688782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,4,power_law_1.01,0.13017599582672118
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,8,power_law_1.2,0.8379136085510254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,4,power_law_1.2,0.1004480004310608
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,4,power_law_1.01,0.14410239458084106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,8,power_law_1.2,1.1621184349060059
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,4,power_law_1.2,0.11886080503463745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,4,power_law_1.01,0.17358720302581787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,8,power_law_1.2,1.4365440368652345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,4,power_law_1.2,0.1336192011833191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,4,power_law_1.01,0.18302079439163207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,8,power_law_1.2,1.7718015670776368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,4,power_law_1.2,0.1631168007850647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,4,power_law_1.01,0.18793599605560302
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,8,power_law_1.2,2.9283199310302734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,4,power_law_1.2,0.17212159633636476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,4,power_law_1.01,0.1891584038734436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,4,power_law_1.2,0.17685120105743407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,8,power_law_1.2,5.898521423339844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,4,power_law_1.2,0.18850560188293458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,4,power_law_1.2,0.2028480052947998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,4,power_law_1.2,0.1999935984611511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,4,power_law_1.2,0.2267904043197632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,4,power_law_1.2,0.2370431900024414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,4,power_law_1.2,0.24544000625610352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,4,power_law_1.2,0.2466752052307129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,4,power_law_1.2,0.2782144069671631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,2,power_law_1.01,0.06342399716377259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,4,power_law_1.2,0.2933631896972656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,2,power_law_1.01,0.07408000230789184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,4,power_law_1.2,0.34858880043029783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,2,power_law_1.01,0.10355839729309083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,4,power_law_1.2,0.40273280143737794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,2,power_law_1.01,0.08836479783058167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,4,power_law_1.2,0.4944767951965332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,2,power_law_1.01,0.11891839504241944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,4,power_law_1.2,0.5882495880126953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,2,power_law_1.01,0.14739840030670165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,4,power_law_1.2,0.7748544216156006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,2,power_law_1.01,0.16787840127944947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,4,power_law_1.2,0.98538236618042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,2,power_law_1.01,0.2065471887588501
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,4,power_law_1.2,1.3042431831359864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,2,power_law_1.01,0.21496961116790772
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,4,power_law_1.2,1.6952192306518554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,2,power_law_1.01,0.22644479274749757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,4,power_law_1.2,1.937491226196289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,2,power_law_1.01,0.23934719562530518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,2,power_law_1.01,0.24405760765075685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,4,power_law_1.2,3.1458112716674806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,2,power_law_1.01,0.24977920055389405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,4,power_law_1.2,5.819059371948242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,2,power_law_1.01,0.27067520618438723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,2,power_law_1.01,0.3095936059951782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,2,power_law_1.2,0.06682239770889283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,2,power_law_1.01,0.3235136032104492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,2,power_law_1.2,0.07442560195922851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,2,power_law_1.01,0.2993472099304199
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,2,power_law_1.2,0.0844543993473053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,2,power_law_1.01,0.3272063970565796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,2,power_law_1.2,0.0881600022315979
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,2,power_law_1.01,0.36878719329833987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,2,power_law_1.2,0.11210240125656128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,2,power_law_1.01,0.43715200424194334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,2,power_law_1.2,0.14466559886932373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,2,power_law_1.2,0.16637439727783204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,2,power_law_1.01,0.4871551990509033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,2,power_law_1.2,0.200927996635437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,2,power_law_1.01,0.612499189376831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,2,power_law_1.2,0.21571838855743408
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,2,power_law_1.01,0.7396736145019531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,2,power_law_1.2,0.2188096046447754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,2,power_law_1.01,0.9714943885803222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,2,power_law_1.2,0.24337921142578126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,2,power_law_1.01,1.2067456245422363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,2,power_law_1.2,0.2622335910797119
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,2,power_law_1.01,1.632192039489746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,2,power_law_1.2,0.2716480016708374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,2,power_law_1.01,2.018239974975586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,2,power_law_1.2,0.2663167953491211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,2,power_law_1.01,2.465715217590332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,2,power_law_1.2,0.276147198677063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,2,power_law_1.01,3.6627838134765627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,2,power_law_1.2,0.2814719915390015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,2,power_law_1.2,0.3039999961853027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,2,power_law_1.01,7.191827392578125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,2,power_law_1.2,0.34374399185180665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,2,power_law_1.2,0.37650558948516843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,2,power_law_1.2,0.4469503879547119
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,2,power_law_1.2,0.49816322326660156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,2,power_law_1.2,0.6112063884735107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,2,power_law_1.2,0.7473919868469239
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,2,power_law_1.2,0.9915072441101074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,2,power_law_1.2,1.2186431884765625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,2,power_law_1.2,1.6250816345214845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,2,power_law_1.2,1.9755775451660156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,2,power_law_1.2,2.4446975708007814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,2,power_law_1.2,3.7720577239990236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,2,power_law_1.2,7.186918640136719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,1,power_law_1.01,0.0689087986946106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,1,power_law_1.01,0.07546240091323853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,1,power_law_1.01,0.08958079814910888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,2,8,power_law_1.01,0.023014399409294128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,2,8,power_law_1.01,0.02260479927062988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,1,power_law_1.01,0.10495359897613525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,2,8,power_law_1.01,0.02242559939622879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,1,power_law_1.01,0.14673279523849486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,2,8,power_law_1.01,0.023219199478626253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,2,8,power_law_1.01,0.026713600754737853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,1,power_law_1.01,0.2151360034942627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,2,8,power_law_1.01,0.028748801350593566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,1,power_law_1.01,0.24236159324645995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,2,8,power_law_1.01,0.028755199909210206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,2,8,power_law_1.01,0.030803200602531434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,1,power_law_1.01,0.31118719577789306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,2,8,power_law_1.01,0.03121280074119568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,1,power_law_1.01,0.3251136064529419
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,2,8,power_law_1.01,0.032441601157188416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,2,8,power_law_1.01,0.03366400003433227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,1,power_law_1.01,0.3093440055847168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,2,8,power_law_1.01,0.04323199987411499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,1,power_law_1.01,0.3279616117477417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,2,8,power_law_1.01,0.04595839977264404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,2,8,power_law_1.01,0.04922879934310913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,1,power_law_1.01,0.33658881187438966
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,2,8,power_law_1.01,0.057011198997497556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,1,power_law_1.01,0.34497919082641604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,2,8,power_law_1.01,0.05864319801330566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,2,8,power_law_1.01,0.07728639841079712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,1,power_law_1.01,0.3611520051956177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,2,8,power_law_1.01,0.10350079536437988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,1,power_law_1.01,0.38020479679107666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,2,8,power_law_1.01,0.14076160192489623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,2,8,power_law_1.01,0.1790719985961914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,1,power_law_1.01,0.3879744052886963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,2,8,power_law_1.01,0.2372351884841919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,1,power_law_1.01,0.4125376224517822
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,2,8,power_law_1.01,0.3580672025680542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,1,power_law_1.01,0.47153921127319337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,2,8,power_law_1.01,0.4440959930419922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,2,8,power_law_1.01,0.6369984149932861
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,1,power_law_1.01,0.5211071968078613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,1,power_law_1.2,0.06629120111465454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,2,8,power_law_1.01,0.8657279968261719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,1,power_law_1.01,0.6239232063293457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,1,power_law_1.2,0.07264639735221863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,2,8,power_law_1.01,1.28090238571167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,2,8,power_law_1.01,1.83953914642334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,1,power_law_1.01,0.7076608180999756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,1,power_law_1.2,0.08472319841384887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,2,8,power_law_1.01,2.3784128189086915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,1,power_law_1.01,0.8883071899414062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,1,power_law_1.2,0.10478719472885131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,2,8,power_law_1.01,3.3344192504882812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,1,power_law_1.01,1.088806438446045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,1,power_law_1.2,0.13672959804534912
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,2,8,power_law_1.01,7.310208129882812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,1,power_law_1.2,0.17646080255508423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,1,power_law_1.01,1.4033663749694825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,1,power_law_1.2,0.20268800258636474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,1,power_law_1.01,1.8123519897460938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,1,power_law_1.2,0.2702719926834106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,1,power_law_1.01,2.4198144912719726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,1,power_law_1.2,0.28051199913024905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,1,power_law_1.01,2.931590461730957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,2,8,power_law_1.2,0.02322559952735901
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,1,power_law_1.2,0.30018560886383056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,2,8,power_law_1.2,0.022195200622081756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,1,power_law_1.01,3.5609409332275392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,2,8,power_law_1.2,0.02240000069141388
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,1,power_law_1.2,0.33252480030059817
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,2,8,power_law_1.2,0.02240640074014664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,1,power_law_1.01,5.442623901367187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,1,power_law_1.2,0.3644864082336426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,2,8,power_law_1.2,0.02588160037994385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,2,8,power_law_1.2,0.029977598786354066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,1,power_law_1.2,0.37655680179595946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,2,8,power_law_1.2,0.0297791987657547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,1,power_law_1.01,10.396550750732422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,1,power_law_1.2,0.36119680404663085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,2,8,power_law_1.2,0.03203839957714081
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,2,8,power_law_1.2,0.03142400085926056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,1,power_law_1.2,0.3673408031463623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,2,8,power_law_1.2,0.03079040050506592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,1,power_law_1.2,0.3888511896133423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,2,8,power_law_1.2,0.034483200311660765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,2,8,power_law_1.01,0.045151999592781066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,1,power_law_1.2,0.4173120021820068
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,2,8,power_law_1.2,0.045535999536514285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,2,8,power_law_1.01,0.04842880070209503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,2,8,power_law_1.2,0.04575360119342804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,2,8,power_law_1.01,0.047193598747253415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,1,power_law_1.2,0.4797823905944824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,2,8,power_law_1.2,0.05004799962043762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,2,8,power_law_1.01,0.045151999592781066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,1,power_law_1.2,0.5293312072753906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,2,8,power_law_1.01,0.04513919949531555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,2,8,power_law_1.2,0.06316159963607788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,2,8,power_law_1.01,0.04575999975204468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,2,8,power_law_1.2,0.07443199753761291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,1,power_law_1.2,0.6397183895111084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,2,8,power_law_1.01,0.04679040014743805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,2,8,power_law_1.2,0.0815936028957367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,4,power_law_1.01,0.20391039848327636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,1,power_law_1.2,0.7253183841705322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,2,8,power_law_1.01,0.04658559858798981
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,2,8,power_law_1.2,0.11067520380020142
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,4,power_law_1.01,0.1985856056213379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,2,8,power_law_1.01,0.04760960042476654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,2,8,power_law_1.2,0.12661759853363036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,1,power_law_1.2,0.9133376121520996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,4,power_law_1.01,0.213318395614624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,2,8,power_law_1.01,0.04924159944057464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,2,8,power_law_1.2,0.1987328052520752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,1,power_law_1.2,1.098681640625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,2,8,power_law_1.01,0.050892800092697144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,2,8,power_law_1.2,0.2576832056045532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,4,power_law_1.01,0.22602880001068115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,2,8,power_law_1.01,0.05374720096588135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,2,8,power_law_1.2,0.3490623950958252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,1,power_law_1.2,1.421440029144287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,4,power_law_1.01,0.22787199020385743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,2,8,power_law_1.01,0.05497599840164184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,2,8,power_law_1.2,0.47521281242370605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,2,8,power_law_1.01,0.0574400007724762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,1,power_law_1.2,1.8328960418701172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,4,power_law_1.01,0.24240639209747314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,2,8,power_law_1.2,0.728934383392334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,2,8,power_law_1.01,0.07095680236816407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,2,8,power_law_1.2,0.9562944412231446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,4,power_law_1.01,0.2715008020401001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,1,power_law_1.2,2.432147216796875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,2,8,power_law_1.01,0.06991999745368957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,2,8,power_law_1.2,1.3845248222351074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,2,8,power_law_1.01,0.07546240091323853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,4,power_law_1.01,0.29155840873718264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,1,power_law_1.2,2.9648128509521485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,2,8,power_law_1.2,1.705446434020996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,2,8,power_law_1.01,0.091839998960495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,4,power_law_1.01,0.3403007984161377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,2,8,power_law_1.2,2.1656383514404296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,2,8,power_law_1.01,0.10003839731216431
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,1,power_law_1.2,3.574720001220703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,2,8,power_law_1.01,0.12742400169372559
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,2,8,power_law_1.2,3.743008041381836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,4,power_law_1.01,0.4021632194519043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,2,8,power_law_1.01,0.1446720004081726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,1,power_law_1.2,5.503936004638672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,2,8,power_law_1.2,7.469747161865234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,4,power_law_1.01,0.4773119926452637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,2,8,power_law_1.01,0.19587839841842652
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,2,8,power_law_1.01,0.2511744022369385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,4,power_law_1.01,0.5788928031921386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,1,power_law_1.2,10.408902740478515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,2,8,power_law_1.01,0.3744447946548462
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,2,8,power_law_1.01,0.4295487880706787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,4,power_law_1.01,0.7674880027770996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,2,8,power_law_1.2,0.044326400756835936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,2,8,power_law_1.01,0.6400767803192139
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,4,power_law_1.01,0.8908096313476562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,2,8,power_law_1.2,0.04759039878845215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,2,8,power_law_1.01,0.8604288101196289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,2,8,power_law_1.2,0.04636160135269165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,4,power_law_1.01,1.2133631706237793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,2,8,power_law_1.01,1.0332672119140625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,4,4,power_law_1.01,0.020812800526618956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,2,8,power_law_1.2,0.04431360065937042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,4,4,power_law_1.01,0.020819200575351714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,2,8,power_law_1.01,1.7799936294555665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,4,power_law_1.01,1.5113280296325684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,2,8,power_law_1.2,0.044710400700569156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,4,4,power_law_1.01,0.02041600048542023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,2,8,power_law_1.01,3.9885631561279298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,2,8,power_law_1.2,0.0455487996339798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,4,4,power_law_1.01,0.02040960043668747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,4,power_law_1.01,1.9227903366088868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,2,8,power_law_1.2,0.045542401075363156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,4,4,power_law_1.01,0.023270399868488313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,2,8,power_law_1.2,0.045952001214027406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,4,power_law_1.01,2.8906816482543944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,4,4,power_law_1.01,0.02736639976501465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,4,4,power_law_1.2,0.013388800621032714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,2,8,power_law_1.2,0.046777600049972536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,4,4,power_law_1.01,0.02655999958515167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,4,4,power_law_1.2,0.014336000382900237
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,2,8,power_law_1.2,0.046982398629188536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,4,4,power_law_1.01,0.028806400299072266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,4,power_law_1.01,5.319193649291992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,4,4,power_law_1.2,0.013107199966907502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,2,8,power_law_1.2,0.04963200092315674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,4,4,power_law_1.01,0.027584001421928406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,4,4,power_law_1.2,0.013395200669765472
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,2,8,power_law_1.2,0.052300798892974856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,4,4,power_law_1.01,0.0286080002784729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,4,4,power_law_1.2,0.013817599415779114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,2,8,power_law_1.2,0.05414400100708008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,4,4,power_law_1.01,0.030239999294281006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,4,4,power_law_1.2,0.01666560024023056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,2,8,power_law_1.2,0.05742080211639404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,4,4,power_law_1.01,0.04990079998970032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,4,4,power_law_1.01,0.03761279881000519
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,4,4,power_law_1.2,0.016582399606704712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,2,8,power_law_1.2,0.0674560010433197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,4,4,power_law_1.01,0.04048640131950378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,4,4,power_law_1.01,0.039052799344062805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,4,4,power_law_1.2,0.016780799627304076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,2,8,power_law_1.2,0.07422080039978027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,4,4,power_law_1.01,0.04168959856033325
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,4,4,power_law_1.01,0.0412992000579834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,4,4,power_law_1.2,0.01626880019903183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,2,8,power_law_1.2,0.07910400032997131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,4,4,power_law_1.01,0.04170880019664765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,4,4,power_law_1.01,0.04886400103569031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,4,4,power_law_1.2,0.01648000031709671
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,2,8,power_law_1.2,0.09878399968147278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,4,4,power_law_1.01,0.04170880019664765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,4,4,power_law_1.01,0.058713597059249875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,4,4,power_law_1.2,0.01645440012216568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,2,8,power_law_1.2,0.0959231972694397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,4,4,power_law_1.01,0.042931199073791504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,4,4,power_law_1.2,0.01401599943637848
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,4,4,power_law_1.01,0.060140800476074216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,2,8,power_law_1.2,0.12378239631652832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,4,4,power_law_1.01,0.04170880019664765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,4,4,power_law_1.2,0.014214399456977844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,4,4,power_law_1.01,0.07858560085296631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,2,8,power_law_1.2,0.14958080053329467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,4,4,power_law_1.01,0.04314239919185638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,4,4,power_law_1.2,0.015046399831771851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,4,4,power_law_1.01,0.08144000172615051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,2,8,power_law_1.2,0.19874559640884398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,4,4,power_law_1.01,0.04663040041923523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,4,4,power_law_1.2,0.016467200219631196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,4,4,power_law_1.01,0.15353599786758423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,4,4,power_law_1.01,0.04785279929637909
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,2,8,power_law_1.2,0.2526015996932983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,4,4,power_law_1.2,0.017292800545692443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,4,4,power_law_1.01,0.16254080533981324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,4,4,power_law_1.01,0.047040000557899475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,2,8,power_law_1.2,0.3642175912857056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,4,4,power_law_1.2,0.019334399700164796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,4,4,power_law_1.01,0.2510080099105835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,4,4,power_law_1.01,0.04826239943504333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,2,8,power_law_1.2,0.45554561614990235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,4,4,power_law_1.2,0.02261119931936264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,4,4,power_law_1.01,0.2639296054840088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,4,4,power_law_1.01,0.050310397148132326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,4,4,power_law_1.2,0.024665600061416625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,2,8,power_law_1.2,0.6769472122192383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,4,4,power_law_1.01,0.4801919937133789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,4,4,power_law_1.01,0.05440639853477478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,4,4,power_law_1.2,0.030803200602531434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,2,8,power_law_1.2,0.8973119735717774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,4,4,power_law_1.01,0.7814464092254638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,4,4,power_law_1.01,0.06198400259017944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,4,4,power_law_1.2,0.03532159924507141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,2,8,power_law_1.2,1.048038387298584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,4,4,power_law_1.01,0.8449407577514648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,4,4,power_law_1.01,0.06423680186271667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,4,4,power_law_1.2,0.04474239945411682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,2,8,power_law_1.2,1.8643648147583007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,4,4,power_law_1.01,1.3374784469604493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,4,4,power_law_1.01,0.07141119837760926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,4,4,power_law_1.2,0.05436800122261047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,2,8,power_law_1.2,3.821644973754883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,4,4,power_law_1.2,0.0738048017024994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,4,4,power_law_1.01,1.7960191726684571
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,4,4,power_law_1.2,0.09491199851036072
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,4,4,power_law_1.01,2.648396873474121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,4,4,power_law_1.2,0.13752959966659545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,4,4,power_law_1.01,5.226828765869141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,4,4,power_law_1.2,0.1774399995803833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,4,4,power_law_1.2,0.048416000604629514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,4,4,power_law_1.2,0.21696000099182128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,4,4,power_law_1.2,0.040633600950241086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,4,4,power_law_1.2,0.337388801574707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,4,4,power_law_1.2,0.041875201463699344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,4,4,power_law_1.2,0.6511424064636231
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,8,2,power_law_1.01,0.01857919991016388
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,4,4,power_law_1.2,0.043084800243377686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,8,2,power_law_1.01,0.018982400000095368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,4,4,power_law_1.2,0.04307839870452881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,8,2,power_law_1.01,0.019193600118160247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,4,4,power_law_1.2,0.04307839870452881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,8,2,power_law_1.01,0.018982400000095368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,4,4,power_law_1.2,0.04328320026397705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,8,2,power_law_1.2,0.018931199610233308
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,8,2,power_law_1.01,0.020422400534152986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,4,4,power_law_1.2,0.0430976003408432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,8,2,power_law_1.2,0.019340799748897554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,8,2,power_law_1.01,0.02942720055580139
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,8,2,power_law_1.2,0.018726399540901183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,4,4,power_law_1.2,0.04636160135269165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,8,2,power_law_1.01,0.027987200021743774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,8,2,power_law_1.2,0.01905920058488846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,4,4,power_law_1.2,0.04739840030670166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,8,2,power_law_1.01,0.030457600951194763
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,8,2,power_law_1.2,0.020160000026226043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,4,4,power_law_1.2,0.04759680032730103
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,8,2,power_law_1.01,0.02881920039653778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,8,2,power_law_1.2,0.021798400580883025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,4,4,power_law_1.2,0.05046399831771851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,8,2,power_law_1.01,0.02942720055580139
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,8,2,power_law_1.2,0.021196800470352172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,4,4,power_law_1.2,0.05086719989776611
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,8,2,power_law_1.01,0.03395200073719025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,8,2,power_law_1.2,0.022617599368095397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,4,4,power_law_1.2,0.0559935986995697
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,8,2,power_law_1.01,0.038227200508117676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,8,2,power_law_1.2,0.02282239943742752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,4,4,power_law_1.2,0.06234880089759827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,8,2,power_law_1.01,0.04089600145816803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,8,2,power_law_1.2,0.023647999763488768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,4,4,power_law_1.2,0.06602240204811097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,8,2,power_law_1.01,0.038841599225997926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,8,2,power_law_1.2,0.024672000110149382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,4,4,power_law_1.2,0.07216640114784241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,8,2,power_law_1.01,0.04110080003738403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,8,2,power_law_1.2,0.027539199590682982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,4,4,power_law_1.2,0.09183359742164612
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,8,2,power_law_1.01,0.044172799587249754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,8,2,power_law_1.2,0.02794879972934723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,4,4,power_law_1.2,0.09696000218391418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,8,2,power_law_1.01,0.052767997980117796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,8,2,power_law_1.2,0.028339201211929323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,4,4,power_law_1.2,0.12213759422302246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,8,2,power_law_1.01,0.0683456003665924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,8,2,power_law_1.2,0.03142400085926056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,4,4,power_law_1.2,0.13278720378875733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,8,2,power_law_1.01,0.08042880296707153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,8,2,power_law_1.2,0.04002560079097748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,4,4,power_law_1.2,0.1766144037246704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,8,2,power_law_1.01,0.1125823974609375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,8,2,power_law_1.2,0.04165120124816894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,4,4,power_law_1.2,0.1860479950904846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,8,2,power_law_1.01,0.14595199823379518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,4,4,power_law_1.2,0.3148672103881836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,8,2,power_law_1.01,0.19736319780349731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,4,4,power_law_1.2,0.4625216007232666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,8,2,power_law_1.01,0.2518079996109009
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,4,4,power_law_1.2,0.6597439765930175
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,8,2,power_law_1.01,0.39844479560852053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,4,4,power_law_1.2,0.7826240062713623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,8,2,power_law_1.01,0.47362561225891114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,4,4,power_law_1.2,1.0394495964050292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,8,2,power_law_1.01,0.6831488132476806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,4,4,power_law_1.2,1.6591552734375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,8,2,power_law_1.01,0.9854144096374512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,4,4,power_law_1.2,3.170572853088379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,8,2,power_law_1.01,1.2639552116394044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,8,2,power_law_1.01,1.9281280517578125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,8,2,power_law_1.01,3.8372737884521486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,8,2,power_law_1.01,0.04043520092964172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,8,2,power_law_1.01,0.04022400081157684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,8,2,power_law_1.01,0.03898879885673523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,8,2,power_law_1.2,0.039673599600791934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,8,2,power_law_1.01,0.04185599982738495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,8,2,power_law_1.2,0.038848000764846805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,8,2,power_law_1.01,0.04083200097084046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,8,2,power_law_1.2,0.039263999462127684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,8,2,power_law_1.01,0.04267520010471344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,8,2,power_law_1.2,0.04089600145816803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,8,2,power_law_1.01,0.04226559996604919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,8,2,power_law_1.2,0.04149760007858276
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,8,2,power_law_1.01,0.04227199852466583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,8,2,power_law_1.2,0.041503998637199405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,8,2,power_law_1.01,0.04390400052070618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,8,2,power_law_1.2,0.04232319891452789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,8,2,power_law_1.01,0.04514560103416443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,8,2,power_law_1.2,0.042124798893928526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,8,2,power_law_1.01,0.044736000895500186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,8,2,power_law_1.2,0.04312959909439087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,8,2,power_law_1.01,0.049644801020622256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,8,2,power_law_1.2,0.04438399970531463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,8,2,power_law_1.01,0.053529602289199826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,8,2,power_law_1.2,0.04561919867992401
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,8,2,power_law_1.01,0.053337597846984865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,8,2,power_law_1.2,0.049081599712371825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,8,2,power_law_1.01,0.059059202671051025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,8,2,power_law_1.2,0.048876801133155824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,8,2,power_law_1.01,0.06151679754257202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,8,2,power_law_1.2,0.052160000801086424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,8,2,power_law_1.01,0.06767359972000123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,8,2,power_law_1.2,0.05911679863929749
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,8,2,power_law_1.01,0.08179200291633607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,8,2,power_law_1.2,0.06668800115585327
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,8,2,power_law_1.01,0.09162240028381348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,8,2,power_law_1.2,0.06670079827308655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,8,2,power_law_1.01,0.1049407958984375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,8,2,power_law_1.2,0.07428479790687562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,8,2,power_law_1.01,0.11763199567794799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,8,2,power_law_1.2,0.09086719751358033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,8,2,power_law_1.01,0.16064000129699707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,8,2,power_law_1.2,0.10970239639282227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,8,2,power_law_1.01,0.18318079710006713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,8,2,power_law_1.2,0.12527999877929688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,8,2,power_law_1.01,0.24788479804992675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,8,2,power_law_1.2,0.15557760000228882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,8,2,power_law_1.01,0.32508800029754636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,8,2,power_law_1.2,0.20084478855133056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,8,2,power_law_1.01,0.480947208404541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,8,2,power_law_1.2,0.25798399448394777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,8,2,power_law_1.01,0.5665535926818848
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,8,2,power_law_1.2,0.36652801036834715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,8,2,power_law_1.01,0.7359231948852539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,8,2,power_law_1.2,0.4978047847747803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,8,2,power_law_1.01,1.254265594482422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,8,2,power_law_1.2,0.6466879844665527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,8,2,power_law_1.01,2.486150360107422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,8,2,power_law_1.2,0.8203455924987793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,8,2,power_law_1.2,1.1056511878967286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,8,2,power_law_1.2,2.607372856140137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,16,1,power_law_1.01,0.01809920072555542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,16,1,power_law_1.01,0.018105599284172057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,16,1,power_law_1.01,0.01892479956150055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,16,1,power_law_1.01,0.021568000316619873
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,16,1,power_law_1.2,0.01831679940223694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,16,1,power_law_1.01,0.02260479927062988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,16,1,power_law_1.2,0.018361599743366243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,16,1,power_law_1.01,0.027116799354553224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,16,1,power_law_1.2,0.017958399653434754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,16,1,power_law_1.01,0.024249599874019624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,16,1,power_law_1.2,0.01774719953536987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,16,1,power_law_1.01,0.03182719945907593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,16,1,power_law_1.2,0.019180800020694732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,16,1,power_law_1.2,0.022873599827289582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,16,1,power_law_1.01,0.028748801350593566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,16,1,power_law_1.2,0.022873599827289582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,16,1,power_law_1.01,0.027929601073265076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,16,1,power_law_1.2,0.02369280010461807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,16,1,power_law_1.01,0.03059200048446655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,16,1,power_law_1.2,0.02409600019454956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,16,1,power_law_1.01,0.029158401489257812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,16,1,power_law_1.2,0.02451840043067932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,16,1,power_law_1.01,0.029516801238059998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,16,1,power_law_1.2,0.02655999958515167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,16,1,power_law_1.01,0.03919360041618347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,16,1,power_law_1.2,0.028825598955154418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,16,1,power_law_1.01,0.04145280122756958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,16,1,power_law_1.2,0.02861439883708954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,16,1,power_law_1.01,0.04266240000724793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,16,1,power_law_1.2,0.029420799016952513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,16,1,power_law_1.01,0.04268800020217896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,16,1,power_law_1.2,0.0310591995716095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,16,1,power_law_1.01,0.05311999917030334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,16,1,power_law_1.2,0.04131200015544891
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,16,1,power_law_1.01,0.0639743983745575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,16,1,power_law_1.2,0.0412992000579834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,16,1,power_law_1.01,0.08138239979743958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,16,1,power_law_1.2,0.0521664023399353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,16,1,power_law_1.01,0.10042879581451417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,16,1,power_law_1.2,0.05605120062828064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,16,1,power_law_1.01,0.13320319652557372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,16,1,power_law_1.2,0.07856640219688416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,16,1,power_law_1.01,0.1692415952682495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,16,1,power_law_1.2,0.09312639832496643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,16,1,power_law_1.01,0.23600640296936035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,16,1,power_law_1.2,0.12874879837036132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,16,1,power_law_1.01,0.3072704076766968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,16,1,power_law_1.2,0.16460800170898438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,16,1,power_law_1.01,0.4502272129058838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,16,1,power_law_1.2,0.23546240329742432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,16,1,power_law_1.01,0.5935935974121094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,16,1,power_law_1.2,0.3071295976638794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,16,1,power_law_1.01,0.733465576171875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,16,1,power_law_1.2,0.44946560859680174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,16,1,power_law_1.01,1.1633343696594238
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,16,1,power_law_1.2,0.5903744220733642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,16,1,power_law_1.01,2.3032768249511717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,16,1,power_law_1.2,0.7322944164276123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,16,1,power_law_1.2,1.1674559593200684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,16,1,power_law_1.2,2.3111103057861326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,16,1,power_law_1.01,0.03939839899539947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,16,1,power_law_1.01,0.03898879885673523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,16,1,power_law_1.01,0.03978880047798157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,16,1,power_law_1.2,0.03864319920539856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,16,1,power_law_1.01,0.045337599515914914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,16,1,power_law_1.2,0.03904640078544617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,16,1,power_law_1.01,0.045542401075363156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,16,1,power_law_1.2,0.03925760090351105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,16,1,power_law_1.01,0.04535039961338043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,16,1,power_law_1.2,0.04376319944858551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,16,1,power_law_1.01,0.04636160135269165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,16,1,power_law_1.2,0.044588801264762876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,16,1,power_law_1.01,0.04677119851112366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,16,1,power_law_1.2,0.04498560130596161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,16,1,power_law_1.01,0.04636160135269165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,16,1,power_law_1.2,0.04539520144462585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,16,1,power_law_1.01,0.046367999911308286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,16,1,power_law_1.01,0.04922879934310913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,16,1,power_law_1.01,0.05084800124168396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,16,1,power_law_1.01,0.05169919729232788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,16,1,power_law_1.01,0.0559935986995697
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,16,1,power_law_1.01,0.06439679861068726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,16,1,power_law_1.01,0.06848639845848084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,16,1,power_law_1.01,0.0692799985408783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,16,1,power_law_1.01,0.0828224003314972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,16,1,power_law_1.01,0.08814719915390015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,16,1,power_law_1.01,0.11026560068130493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,16,1,power_law_1.01,0.1270591974258423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,16,1,power_law_1.01,0.16145919561386107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,16,1,power_law_1.01,0.19525760412216187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,16,1,power_law_1.01,0.26898560523986814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,16,1,power_law_1.01,0.34374399185180665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,16,1,power_law_1.01,0.4932415962219238
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,16,1,power_law_1.01,0.6275904178619385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,16,1,power_law_1.01,0.7744128227233886
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,4,4,power_law_1.01,0.0914687991142273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,4,4,power_law_1.01,0.09536640048027038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,16,1,power_law_1.01,1.2104512214660645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,4,4,power_law_1.01,0.11500799655914307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,16,1,power_law_1.01,2.429209518432617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,4,4,power_law_1.01,0.13366400003433226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,4,4,power_law_1.01,0.16581759452819825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,4,4,power_law_1.01,0.2153791904449463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,4,4,power_law_1.01,0.3106112003326416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,2,8,power_law_1.01,0.011462400108575821
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,4,4,power_law_1.01,0.3681600093841553
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,2,8,power_law_1.01,0.012985600531101227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,4,4,power_law_1.01,0.5109055995941162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,2,8,power_law_1.01,0.013100799918174744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,4,4,power_law_1.01,0.8092991828918457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,2,8,power_law_1.01,0.012870399653911591
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,4,4,power_law_1.01,1.0321151733398437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,2,8,power_law_1.01,0.012985600531101227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,4,4,power_law_1.01,1.6547008514404298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,2,8,power_law_1.01,0.015647999942302704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,2,8,power_law_1.01,0.014150400459766389
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,4,4,power_law_1.01,2.875519943237305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,2,8,power_law_1.01,0.01605760008096695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,2,8,power_law_1.01,0.014214399456977844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,2,8,power_law_1.01,0.014412799477577209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,2,8,power_law_1.01,0.01687040030956268
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,2,8,power_law_1.01,0.014003199338912965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,2,8,power_law_1.01,0.013804799318313599
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,2,8,power_law_1.01,0.016051200032234193
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,2,8,power_law_1.01,0.016659200191497803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,2,8,power_law_1.2,0.024915200471878052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,2,8,power_law_1.01,0.017689600586891174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,2,8,power_law_1.2,0.024102400243282317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,2,8,power_law_1.01,0.020351999998092653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,2,8,power_law_1.2,0.02449920028448105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,2,8,power_law_1.01,0.02465279996395111
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,2,8,power_law_1.2,0.024915200471878052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,2,8,power_law_1.01,0.02526719868183136
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,2,8,power_law_1.2,0.03268480002880096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,2,8,power_law_1.01,0.03345920145511627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,2,8,power_law_1.2,0.04744960069656372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,2,8,power_law_1.01,0.03694080114364624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,2,8,power_law_1.2,0.03966079950332642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,2,8,power_law_1.2,0.049881601333618165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,2,8,power_law_1.01,0.04755840003490448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,2,8,power_law_1.2,0.04252159893512726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,2,8,power_law_1.01,0.058246397972106935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,2,8,power_law_1.2,0.04211840033531189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,2,8,power_law_1.01,0.08241279721260071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,8,2,power_law_1.2,0.05230720043182373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,2,8,power_law_1.2,0.05256959795951843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,2,8,power_law_1.01,0.10736639499664306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,8,2,power_law_1.2,0.05578879714012146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,2,8,power_law_1.2,0.06383360028266907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,2,8,power_law_1.01,0.15245440006256103
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,8,2,power_law_1.2,0.07790719866752624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,2,8,power_law_1.2,0.06424319744110107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,2,8,power_law_1.01,0.197107195854187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,8,2,power_law_1.2,0.09123839735984803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,2,8,power_law_1.2,0.0830847978591919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,2,8,power_law_1.01,0.24031360149383546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,8,2,power_law_1.2,0.12789119482040406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,2,8,power_law_1.2,0.0933247983455658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,8,2,power_law_1.2,0.16393599510192872
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,2,8,power_law_1.01,0.37200639247894285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,2,8,power_law_1.2,0.10444799661636353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,8,2,power_law_1.2,0.24666879177093506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,2,8,power_law_1.01,0.722815990447998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,2,8,power_law_1.2,0.12525440454483033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,8,2,power_law_1.2,0.3105600118637085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,2,8,power_law_1.2,0.17768319845199584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,8,2,power_law_1.2,0.45475201606750487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,2,8,power_law_1.2,0.22602241039276122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,8,2,power_law_1.2,0.6001471996307373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,2,8,power_law_1.2,0.3247488021850586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,8,2,power_law_1.2,0.7482175827026367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,2,8,power_law_1.2,0.41710720062255857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,2,8,power_law_1.01,0.05331839919090271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,8,2,power_law_1.2,1.188326358795166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,2,8,power_law_1.2,0.6137216091156006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,2,8,power_law_1.01,0.053337597846984865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,2,8,power_law_1.2,0.8035648345947266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,8,2,power_law_1.2,2.3481088638305665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,2,8,power_law_1.01,0.049439999461174014
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,2,8,power_law_1.2,1.1883839607238769
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,2,8,power_law_1.01,0.04924159944057464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,2,8,power_law_1.01,0.05087360143661499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,2,8,power_law_1.2,1.5723711967468261
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,2,8,power_law_1.01,0.05127679705619812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,2,8,power_law_1.2,2.342425537109375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,2,8,power_law_1.01,0.05251200199127197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,2,8,power_law_1.2,3.108582305908203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,2,8,power_law_1.2,0.05252479910850525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,2,8,power_law_1.01,0.051481598615646364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,2,8,power_law_1.2,0.052928000688552856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,2,8,power_law_1.2,3.8774017333984374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,2,8,power_law_1.01,0.0500544011592865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,2,8,power_law_1.2,0.05252479910850525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,2,8,power_law_1.2,6.185055923461914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,2,8,power_law_1.01,0.057017600536346434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,2,8,power_law_1.2,0.05130879878997803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,2,8,power_law_1.01,0.05761920213699341
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,2,8,power_law_1.2,0.05129600167274475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,2,8,power_law_1.2,12.334003448486328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,2,8,power_law_1.01,0.061324799060821535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,2,8,power_law_1.2,0.05231999754905701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,2,8,power_law_1.01,0.06602240204811097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,2,8,power_law_1.2,0.05189120173454285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,2,8,power_law_1.01,0.07238399982452393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,2,8,power_law_1.2,0.052102398872375486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,2,8,power_law_1.01,0.08365439772605895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,2,8,power_law_1.2,0.050886398553848265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,2,8,power_law_1.01,0.09122560024261475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,2,8,power_law_1.2,0.0603007972240448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,4,4,power_law_1.01,0.021433599293231964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,2,8,power_law_1.01,0.09102079868316651
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,2,8,power_law_1.2,0.06255360245704651
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,4,4,power_law_1.01,0.02102400064468384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,2,8,power_law_1.01,0.11415040493011475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,2,8,power_law_1.2,0.06684799790382386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,4,4,power_law_1.01,0.022047999501228332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,2,8,power_law_1.01,0.12438399791717529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,2,8,power_law_1.2,0.06686080098152161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,4,4,power_law_1.01,0.0212351992726326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,2,8,power_law_1.2,0.07648640275001525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,2,8,power_law_1.01,0.15368319749832154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,4,4,power_law_1.01,0.023052799701690673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,2,8,power_law_1.2,0.08631680011749268
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,2,8,power_law_1.01,0.1897279977798462
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,4,4,power_law_1.01,0.031065601110458373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,2,8,power_law_1.2,0.088755202293396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,2,8,power_law_1.01,0.2698048114776611
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,4,4,power_law_1.01,0.02961280047893524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,2,8,power_law_1.2,0.09430400133132935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,2,8,power_law_1.01,0.3590912103652954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,4,4,power_law_1.01,0.03207040131092072
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,2,8,power_law_1.2,0.12174719572067261
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,2,8,power_law_1.01,0.4830016136169434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,4,4,power_law_1.01,0.033504000306129454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,2,8,power_law_1.2,0.13115520477294923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,2,8,power_law_1.01,0.5944128036499023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,4,4,power_law_1.01,0.034329599142074584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,2,8,power_law_1.2,0.16556799411773682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,2,8,power_law_1.01,0.9292672157287598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,4,4,power_law_1.01,0.03514240086078644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,2,8,power_law_1.2,0.1872704029083252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,2,8,power_law_1.01,1.2723008155822755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,4,4,power_law_1.01,0.05051519870758057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,2,8,power_law_1.2,0.2667455911636353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,2,8,power_law_1.01,1.5903488159179688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,4,4,power_law_1.01,0.04865919947624207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,2,8,power_law_1.2,0.349068808555603
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,2,8,power_law_1.01,2.4718080520629884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,4,4,power_law_1.01,0.054816001653671266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,2,8,power_law_1.2,0.42566399574279784
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,4,4,power_law_1.01,0.0611519992351532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,2,8,power_law_1.2,0.5911295890808106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,2,8,power_law_1.01,5.786700820922851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,4,4,power_law_1.01,0.06709120273590088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,2,8,power_law_1.2,0.9546496391296386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,4,4,power_law_1.01,0.09044479727745056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,2,8,power_law_1.2,1.2722944259643554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,4,4,power_law_1.01,0.10540159940719604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,2,8,power_law_1.2,1.610438346862793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,4,4,power_law_1.01,0.1359231948852539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,4,4,power_law_1.2,0.011135999858379365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,2,8,power_law_1.2,2.430438423156738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,4,4,power_law_1.01,0.21454720497131347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,4,4,power_law_1.2,0.013094399869441987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,4,4,power_law_1.01,0.22766079902648925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,4,4,power_law_1.2,0.014028799533843995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,2,8,power_law_1.2,5.814144134521484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,4,4,power_law_1.01,0.3450047969818115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,4,4,power_law_1.2,0.012595200538635254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,4,4,power_law_1.01,0.4629695892333984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,4,4,power_law_1.2,0.012563200294971466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,4,4,power_law_1.01,0.6446784019470215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,4,4,power_law_1.2,0.01605760008096695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,4,4,power_law_1.01,1.0235136032104493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,4,4,power_law_1.2,0.016748799383640288
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,4,4,power_law_1.01,0.047200000286102294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,4,4,power_law_1.2,0.01626240015029907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,4,4,power_law_1.01,1.3481216430664062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,4,4,power_law_1.01,0.04780800044536591
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,4,4,power_law_1.2,0.017459200322628023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,4,4,power_law_1.01,1.8345151901245118
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,4,4,power_law_1.01,0.04842880070209503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,4,4,power_law_1.2,0.016761599481105803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,4,4,power_law_1.01,2.578771209716797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,4,4,power_law_1.01,0.04718720018863678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,4,4,power_law_1.2,0.017075200378894807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,4,4,power_law_1.01,0.04759039878845215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,4,4,power_law_1.01,4.0570110321044925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,4,4,power_law_1.2,0.015974399447441102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,4,4,power_law_1.01,0.049856001138687135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,4,4,power_law_1.2,0.014617599546909332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,4,4,power_law_1.01,6.6448509216308596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,4,4,power_law_1.01,0.05046399831771851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,4,4,power_law_1.2,0.016467200219631196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,4,4,power_law_1.01,0.05047680139541626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,4,4,power_law_1.2,0.017484800517559053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,4,4,power_law_1.01,0.05621119737625122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,4,4,power_law_1.2,0.018508799374103546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,4,4,power_law_1.01,0.05497599840164184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,4,4,power_law_1.2,0.02178560048341751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,4,4,power_law_1.01,0.05825279951095581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,4,4,power_law_1.2,0.04826239943504333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,4,4,power_law_1.2,0.025900799036026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,4,4,power_law_1.01,0.061945599317550656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,4,4,power_law_1.2,0.046419200301170346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,4,4,power_law_1.2,0.026707199215888978
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,4,4,power_law_1.01,0.06234880089759827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,4,4,power_law_1.2,0.046419200301170346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,4,4,power_law_1.2,0.034092798829078674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,4,4,power_law_1.01,0.06849920153617858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,4,4,power_law_1.2,0.047443199157714847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,4,4,power_law_1.2,0.0398144006729126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,4,4,power_law_1.01,0.07710719704627991
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,4,4,power_law_1.2,0.0474368005990982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,4,4,power_law_1.2,0.051686400175094606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,4,4,power_law_1.01,0.08446720242500305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,4,4,power_law_1.2,0.0474368005990982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,4,4,power_law_1.01,0.09062399864196777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,4,4,power_law_1.2,0.06313599944114685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,4,4,power_law_1.2,0.04865919947624207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,4,4,power_law_1.01,0.09676160216331482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,4,4,power_law_1.2,0.091430401802063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,4,4,power_law_1.2,0.04785279929637909
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,4,4,power_law_1.01,0.11148799657821655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,4,4,power_law_1.2,0.05092480182647705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,4,4,power_law_1.2,0.1176192045211792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,4,4,power_law_1.01,0.14467840194702147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,4,4,power_law_1.2,0.05441280007362366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,4,4,power_law_1.2,0.1688447952270508
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,4,4,power_law_1.2,0.05686399936676025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,4,4,power_law_1.01,0.15530240535736084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,4,4,power_law_1.2,0.21716480255126952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,4,4,power_law_1.2,0.06219519972801209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,4,4,power_law_1.01,0.24174079895019532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,4,4,power_law_1.2,0.2667263984680176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,4,4,power_law_1.2,0.0630016028881073
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,4,4,power_law_1.01,0.2698048114776611
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,4,4,power_law_1.2,0.41541118621826173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,4,4,power_law_1.2,0.06711680293083191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,4,4,power_law_1.01,0.3922816038131714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,4,4,power_law_1.2,0.8084223747253418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,4,4,power_law_1.2,0.07488639950752259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,4,4,power_law_1.01,0.5350207805633544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,4,4,power_law_1.2,0.07980800271034241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,4,4,power_law_1.01,0.7285376071929932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,4,4,power_law_1.2,0.08737279772758484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,4,4,power_law_1.01,1.2194560050964356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,4,4,power_law_1.2,0.10457600355148315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,4,4,power_law_1.01,1.2882752418518066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,4,4,power_law_1.2,0.12464640140533448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,8,2,power_law_1.01,0.020563200116157532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,4,4,power_law_1.01,2.055865669250488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,4,4,power_law_1.2,0.14430079460144044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,8,2,power_law_1.01,0.01973759979009628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,4,4,power_law_1.2,0.18957439661026002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,4,4,power_law_1.01,4.267103958129883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,8,2,power_law_1.01,0.020147199928760528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,16,1,power_law_1.2,0.04581120014190674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,4,4,power_law_1.2,0.2565376043319702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,8,2,power_law_1.01,0.01992959976196289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,16,1,power_law_1.2,0.04640640020370483
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,4,4,power_law_1.2,0.25817599296569826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,8,2,power_law_1.01,0.02096640020608902
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,16,1,power_law_1.2,0.046623998880386354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,4,4,power_law_1.2,0.447814416885376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,8,2,power_law_1.01,0.024243199825286867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,8,2,power_law_1.2,0.011673600226640702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,16,1,power_law_1.2,0.04867199957370758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,4,4,power_law_1.2,0.5153984069824219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,8,2,power_law_1.01,0.024243199825286867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,8,2,power_law_1.2,0.013312000036239623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,16,1,power_law_1.2,0.050310397148132326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,4,4,power_law_1.2,0.894495964050293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,8,2,power_law_1.01,0.024633599817752837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,8,2,power_law_1.2,0.01340160071849823
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,16,1,power_law_1.2,0.05502079725265503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,4,4,power_law_1.2,1.036620807647705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,8,2,power_law_1.01,0.026291200518608095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,8,2,power_law_1.2,0.01377280056476593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,16,1,power_law_1.2,0.05237119793891907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,4,4,power_law_1.2,1.3530431747436524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,8,2,power_law_1.01,0.026713600754737853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,8,2,power_law_1.2,0.01401599943637848
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,16,1,power_law_1.2,0.06423680186271667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,4,4,power_law_1.2,2.2234432220458986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,8,2,power_law_1.01,0.02691200077533722
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,8,2,power_law_1.2,0.015647999942302704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,16,1,power_law_1.2,0.06747519969940186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,8,2,power_law_1.2,0.01462399959564209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,16,1,power_law_1.2,0.07162240147590637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,4,4,power_law_1.2,5.126476669311524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,8,2,power_law_1.2,0.015251199901103973
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,16,1,power_law_1.2,0.08144639730453491
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,8,2,power_law_1.2,0.014009599387645722
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,16,1,power_law_1.2,0.08963199853897094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,8,2,power_law_1.2,0.01483519971370697
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,16,1,power_law_1.2,0.10990719795227051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,8,2,power_law_1.2,0.016044799983501435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,16,1,power_law_1.2,0.12792960405349732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,8,2,power_law_1.01,0.043756800889968875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,8,2,power_law_1.2,0.01483519971370697
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,16,1,power_law_1.2,0.1615231990814209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,8,2,power_law_1.01,0.04273920059204102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,8,2,power_law_1.2,0.015238399803638458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,16,1,power_law_1.2,0.19487359523773193
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,8,2,power_law_1.01,0.04335359930992126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,8,2,power_law_1.2,0.016672000288963318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,16,1,power_law_1.2,0.27107839584350585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,8,2,power_law_1.01,0.046828800439834596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,8,2,power_law_1.2,0.017689600586891174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,16,1,power_law_1.2,0.34276480674743653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,8,2,power_law_1.01,0.04867199957370758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,8,2,power_law_1.2,0.018323199450969697
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,16,1,power_law_1.2,0.4990079879760742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,8,2,power_law_1.01,0.05111680030822754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,8,2,power_law_1.2,0.020160000026226043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,16,1,power_law_1.2,0.6341887950897217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,8,2,power_law_1.01,0.05051519870758057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,8,2,power_law_1.2,0.023443199694156647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,16,1,power_law_1.2,0.783903980255127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,8,2,power_law_1.01,0.04969600141048432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,8,2,power_law_1.2,0.025887998938560485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,8,2,power_law_1.01,0.05400320291519165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,16,1,power_law_1.2,1.2195136070251464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,8,2,power_law_1.2,0.03245440125465393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,8,2,power_law_1.01,0.05317760109901428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,8,2,power_law_1.2,0.03654400110244751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,16,1,power_law_1.2,2.4255807876586912
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,8,2,power_law_1.01,0.05685120224952698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,8,2,power_law_1.2,0.0463808000087738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,8,2,power_law_1.01,0.06218879818916321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,8,2,power_law_1.2,0.05661439895629883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,8,2,power_law_1.01,0.06259199976921082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,8,2,power_law_1.2,0.08099200129508972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,8,2,power_law_1.01,0.06751360297203064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,8,2,power_law_1.2,0.10372480154037475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,8,2,power_law_1.01,0.07672960162162781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,8,2,power_law_1.2,0.0412992000579834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,8,2,power_law_1.2,0.1438655972480774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,8,2,power_law_1.01,0.0756991982460022
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,8,2,power_law_1.2,0.04254080057144165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,8,2,power_law_1.2,0.18542079925537108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,8,2,power_law_1.01,0.08021759986877441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,8,2,power_law_1.2,0.04191359877586365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,8,2,power_law_1.2,0.22741119861602782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,8,2,power_law_1.01,0.09618560075759888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,8,2,power_law_1.2,0.04784640073776245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,8,2,power_law_1.2,0.3509056091308594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,8,2,power_law_1.01,0.10765440464019775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,8,2,power_law_1.2,0.047443199157714847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,8,2,power_law_1.2,0.677785587310791
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,8,2,power_law_1.01,0.1260800004005432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,8,2,power_law_1.2,0.048607999086380006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,8,2,power_law_1.01,0.1510591983795166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,8,2,power_law_1.2,0.048256000876426695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,8,2,power_law_1.01,0.19775999784469606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,8,2,power_law_1.2,0.050937598943710326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,8,2,power_law_1.01,0.23052799701690674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,8,2,power_law_1.2,0.05236480236053467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,8,2,power_law_1.2,0.05482239723205566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,8,2,power_law_1.01,0.3685760021209717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,16,1,power_law_1.01,0.019756799936294554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,8,2,power_law_1.2,0.05808640122413635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,8,2,power_law_1.01,0.4547840118408203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,16,1,power_law_1.01,0.020160000026226043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,8,2,power_law_1.2,0.06157439947128296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,8,2,power_law_1.01,0.6397312164306641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,16,1,power_law_1.01,0.02056960016489029
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,8,2,power_law_1.2,0.0605567991733551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,8,2,power_law_1.01,0.7396607875823975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,16,1,power_law_1.01,0.020979200303554536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,8,2,power_law_1.2,0.06588159799575806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,8,2,power_law_1.01,1.0034432411193848
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,16,1,power_law_1.01,0.023647999763488768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,8,2,power_law_1.2,0.07611520290374756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,16,1,power_law_1.01,0.024672000110149382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,8,2,power_law_1.01,1.663315200805664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,8,2,power_law_1.2,0.07754240036010743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,16,1,power_law_1.01,0.026719999313354493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,8,2,power_law_1.01,3.7565567016601564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,8,2,power_law_1.2,0.0855296015739441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,16,1,power_law_1.01,0.02508159875869751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,8,2,power_law_1.2,0.0937279999256134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,16,1,power_law_1.01,0.02874239981174469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,8,2,power_law_1.2,0.11134079694747925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,16,1,power_law_1.01,0.02876800000667572
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,8,2,power_law_1.2,0.13181439638137818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,16,1,power_law_1.01,0.02794240117073059
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,8,2,power_law_1.2,0.16090240478515624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,16,1,power_law_1.01,0.03245440125465393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,16,1,power_law_1.2,0.01875839978456497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,8,2,power_law_1.2,0.19367680549621583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,16,1,power_law_1.01,0.03244799971580505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,16,1,power_law_1.2,0.01875839978456497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,8,2,power_law_1.2,0.255731201171875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,16,1,power_law_1.01,0.034092798829078674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,16,1,power_law_1.2,0.020000000298023225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,16,1,power_law_1.01,0.04678399860858917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,8,2,power_law_1.2,0.3906879901885986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,16,1,power_law_1.2,0.019993600249290467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,16,1,power_law_1.01,0.0486272007226944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,8,2,power_law_1.2,0.49696640968322753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,16,1,power_law_1.2,0.022041599452495574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,16,1,power_law_1.01,0.05189759731292724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,8,2,power_law_1.2,0.6313087940216064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,16,1,power_law_1.2,0.023686400055885314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,16,1,power_law_1.01,0.06726400256156921
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,16,1,power_law_1.2,0.025727999210357667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,8,2,power_law_1.2,0.8133952140808105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,16,1,power_law_1.01,0.08281599879264831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,16,1,power_law_1.2,0.024915200471878052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,8,2,power_law_1.2,1.0411328315734862
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,16,1,power_law_1.01,0.11642240285873413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,16,1,power_law_1.2,0.027987200021743774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,8,2,power_law_1.2,1.742367935180664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,16,1,power_law_1.01,0.1371072053909302
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,16,1,power_law_1.2,0.02818560004234314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,8,2,power_law_1.2,3.895840072631836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,16,1,power_law_1.01,0.19893120527267455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,16,1,power_law_1.2,0.026950401067733765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,16,1,power_law_1.01,0.2519999980926514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,16,1,power_law_1.2,0.031667199730873105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,16,1,power_law_1.01,0.36400001049041747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,16,1,power_law_1.2,0.03185920119285583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,16,1,power_law_1.2,0.03433600068092346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,16,1,power_law_1.01,0.46826882362365724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,16,1,power_law_1.2,0.04620800018310547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,16,1,power_law_1.01,0.6945407867431641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,16,1,power_law_1.01,0.04191359877586365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,16,1,power_law_1.2,0.048256000876426695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,16,1,power_law_1.01,0.9161664009094238
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,16,1,power_law_1.01,0.042335999011993405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,16,1,power_law_1.2,0.051123201847076416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,16,1,power_law_1.01,1.1408191680908204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,16,1,power_law_1.01,0.04416640102863312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,16,1,power_law_1.2,0.06668800115585327
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,16,1,power_law_1.01,1.8074752807617187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,16,1,power_law_1.01,0.051526397466659546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,16,1,power_law_1.2,0.08247039914131164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,16,1,power_law_1.01,3.5586814880371094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,16,1,power_law_1.01,0.05237119793891907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,16,1,power_law_1.2,0.11461759805679321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,16,1,power_law_1.01,0.05317760109901428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,16,1,power_law_1.2,0.13550080060958863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,16,1,power_law_1.01,0.05358080267906189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,16,1,power_law_1.2,0.19714560508728027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,16,1,power_law_1.01,0.053395199775695804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,16,1,power_law_1.2,0.24876799583435058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,16,1,power_law_1.01,0.05400320291519165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,16,1,power_law_1.2,0.3620160102844238
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,16,1,power_law_1.01,0.054604798555374146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,16,1,power_law_1.2,0.04289920032024384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,16,1,power_law_1.2,0.4678976058959961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,16,1,power_law_1.2,0.043110400438308716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,16,1,power_law_1.2,0.6950143814086914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,16,1,power_law_1.2,0.04474239945411682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,16,1,power_law_1.2,0.9133248329162598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,16,1,power_law_1.2,0.05252479910850525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,16,1,power_law_1.2,1.1392383575439453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,16,1,power_law_1.2,0.053958398103713986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,16,1,power_law_1.2,1.8042047500610352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,16,1,power_law_1.2,0.053548800945281985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,16,1,power_law_1.2,3.571014404296875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,16,1,power_law_1.2,0.05416319966316223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,16,1,power_law_1.2,0.055795198678970336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,16,1,power_law_1.2,0.057158398628234866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,16,1,power_law_1.2,0.0574400007724762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,16,1,power_law_1.2,0.0574400007724762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,16,1,power_law_1.2,0.06562560200691223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,16,1,power_law_1.2,0.06481279730796814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,16,1,power_law_1.2,0.06562560200691223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,1,16,power_law_1.01,0.022860799729824067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,16,1,power_law_1.2,0.07710080146789551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,1,16,power_law_1.01,0.02449920028448105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,16,1,power_law_1.2,0.0803712010383606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,1,16,power_law_1.01,0.024512000381946564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,16,1,power_law_1.2,0.08447359800338745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,16,1,power_law_1.2,0.10331519842147827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,1,16,power_law_1.01,0.024915200471878052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,16,1,power_law_1.2,0.1145792007446289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,1,16,power_law_1.01,0.034745600819587705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,16,1,power_law_1.2,0.13404799699783326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,1,16,power_law_1.01,0.04170239865779877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,16,1,power_law_1.2,0.1561535954475403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,16,1,power_law_1.2,0.20284159183502198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,1,16,power_law_1.01,0.04497919976711273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,16,1,power_law_1.2,0.24277760982513427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,1,16,power_law_1.01,0.05275520086288452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,16,1,power_law_1.2,0.3388351917266846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,1,16,power_law_1.01,0.0609279990196228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,16,1,power_law_1.2,0.42853760719299316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,16,1,power_law_1.2,0.6144959926605225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,1,16,power_law_1.01,0.06828160285949707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,16,1,power_law_1.2,0.7900032043457031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,1,16,power_law_1.01,0.08511999845504761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,16,1,power_law_1.2,0.9780096054077149
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,1,16,power_law_1.01,0.09987199902534485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,16,1,power_law_1.2,1.5493632316589356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,1,16,power_law_1.01,0.11646080017089844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,16,1,power_law_1.2,3.107308769226074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,1,16,power_law_1.01,0.1477311968803406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,1,16,power_law_1.01,0.10682879686355591
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,1,16,power_law_1.01,0.12232320308685303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,1,16,power_law_1.01,0.1572160005569458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,1,16,power_law_1.01,0.13262079954147338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,1,16,power_law_1.01,0.16745599508285522
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,1,16,power_law_1.01,0.22156159877777098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,1,16,power_law_1.01,0.2882879972457886
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,1,16,power_law_1.01,0.42060160636901855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,1,16,power_law_1.01,0.5539199829101562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,1,16,power_law_1.2,0.052723199129104614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,1,16,power_law_1.01,0.8236479759216309
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,1,16,power_law_1.2,0.08650239706039428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,1,16,power_law_1.01,1.0876288414001465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,1,16,power_law_1.2,0.04371199905872345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,1,16,power_law_1.01,1.628486442565918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,1,16,power_law_1.2,0.04822399914264679
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,1,16,power_law_1.01,2.1607616424560545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,1,16,power_law_1.2,0.057030397653579715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,1,16,power_law_1.01,2.685260772705078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,1,16,power_law_1.2,0.06643199920654297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,1,16,power_law_1.2,0.07751039862632751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,1,16,power_law_1.01,4.267071914672852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,1,16,power_law_1.2,0.07710080146789551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,1,16,power_law_1.2,0.08570240139961242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,1,16,power_law_1.01,8.52042236328125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,1,16,power_law_1.2,0.09859840273857116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,1,16,power_law_1.2,0.11253119707107544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,1,16,power_law_1.2,0.12341120243072509
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,1,16,power_law_1.2,0.13813120126724243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,1,16,power_law_1.01,0.09761279821395874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,1,16,power_law_1.2,0.1704767942428589
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,1,16,power_law_1.01,0.14206080436706542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,1,16,power_law_1.2,0.13527040481567382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,1,16,power_law_1.01,0.08144000172615051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,1,16,power_law_1.2,0.15696640014648439
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,1,16,power_law_1.01,0.07568640112876893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,1,16,power_law_1.2,0.1835904002189636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,1,16,power_law_1.01,0.09208959937095643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,1,16,power_law_1.2,0.16270079612731933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,1,16,power_law_1.01,0.10805759429931641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,1,16,power_law_1.2,0.20551040172576904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,1,16,power_law_1.01,0.1150272011756897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,8,2,power_law_1.01,0.03182719945907593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,1,16,power_law_1.2,0.28005759716033934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,1,16,power_law_1.01,0.12014080286026001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,8,2,power_law_1.01,0.03203839957714081
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,1,16,power_law_1.2,0.3468224048614502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,1,16,power_law_1.01,0.11953279972076417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,8,2,power_law_1.01,0.033055999875068666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,8,2,power_law_1.01,0.045542401075363156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,1,16,power_law_1.2,0.4854720115661621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,1,16,power_law_1.01,0.12260479927062988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,8,2,power_law_1.01,0.04759680032730103
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,1,16,power_law_1.01,0.12567039728164672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,1,16,power_law_1.2,0.5854144096374512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,8,2,power_law_1.01,0.050457602739334105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,1,16,power_law_1.01,0.12977919578552247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,1,16,power_law_1.2,0.9145088195800781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,8,2,power_law_1.01,0.06520959734916687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,1,16,power_law_1.01,0.1281280040740967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,8,2,power_law_1.01,0.08036479949951172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,1,16,power_law_1.2,1.379206371307373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,8,2,power_law_1.01,0.11107840538024902
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,1,16,power_law_1.01,0.13304959535598754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,1,16,power_law_1.2,2.1328704833984373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,8,2,power_law_1.01,0.13176319599151612
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,1,16,power_law_1.01,0.14205440282821655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,1,16,power_law_1.2,2.747270393371582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,8,2,power_law_1.01,0.19300479888916017
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,1,16,power_law_1.01,0.13672959804534912
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,8,2,power_law_1.01,0.24461441040039061
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,1,16,power_law_1.2,3.4216766357421875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,1,16,power_law_1.01,0.15208959579467773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,8,2,power_law_1.01,0.35561599731445315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,8,2,power_law_1.01,0.4666175842285156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,1,16,power_law_1.01,0.16654720306396484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,1,16,power_law_1.2,5.229036712646485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,8,2,power_law_1.01,0.6929279804229737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,1,16,power_law_1.01,0.18097920417785646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,8,2,power_law_1.01,0.916966438293457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,1,16,power_law_1.01,0.21620481014251708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,1,16,power_law_1.2,11.684537506103515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,8,2,power_law_1.01,1.1424448013305664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,1,16,power_law_1.01,0.22725119590759277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,8,2,power_law_1.01,1.8135744094848634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,1,16,power_law_1.01,0.2792704105377197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,8,2,power_law_1.01,3.5951297760009764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,1,16,power_law_1.01,0.3429631948471069
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,1,16,power_law_1.2,0.09818879961967468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,1,16,power_law_1.01,0.4314176082611084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,1,16,power_law_1.2,0.1422271966934204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,1,16,power_law_1.01,0.5325632095336914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,1,16,power_law_1.2,0.0736191987991333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,1,16,power_law_1.01,0.746553611755371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,1,16,power_law_1.2,0.07994880080223084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,1,16,power_law_1.01,0.9739520072937011
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,1,16,power_law_1.2,0.09962239861488342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,2,8,power_law_1.01,0.02588160037994385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,1,16,power_law_1.01,1.1936896324157715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,1,16,power_law_1.2,0.10085120201110839
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,2,8,power_law_1.01,0.027935999631881713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,1,16,power_law_1.01,1.8377920150756837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,1,16,power_law_1.2,0.11027840375900269
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,2,8,power_law_1.01,0.031219199299812317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,1,16,power_law_1.2,0.11765120029449463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,2,8,power_law_1.01,0.03243519961833954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,1,16,power_law_1.01,3.6087039947509765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,1,16,power_law_1.2,0.12112640142440796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,2,8,power_law_1.01,0.04514560103416443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,1,16,power_law_1.2,0.12256640195846558
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,2,8,power_law_1.01,0.04757120013237
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,1,16,power_law_1.2,0.12543359994888306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,2,8,power_law_1.01,0.057843202352523805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,1,16,power_law_1.2,0.1258239984512329
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,2,8,power_law_1.01,0.06909440159797668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,1,16,power_law_1.2,0.12543359994888306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,2,8,power_law_1.01,0.07052800059318542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,2,8,power_law_1.2,0.0253248006105423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,1,16,power_law_1.2,0.13056000471115112
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,2,8,power_law_1.01,0.07748479843139648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,2,8,power_law_1.2,0.02736639976501465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,1,16,power_law_1.2,0.14139519929885863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,2,8,power_law_1.01,0.09366400241851806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,2,8,power_law_1.2,0.0310591995716095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,1,16,power_law_1.2,0.14345599412918092
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,2,8,power_law_1.01,0.11107840538024902
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,2,8,power_law_1.2,0.03146879971027374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,1,16,power_law_1.2,0.16004480123519899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,2,8,power_law_1.01,0.12787840366363526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,2,8,power_law_1.2,0.045184001326560974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,1,16,power_law_1.2,0.17950079441070557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,2,8,power_law_1.01,0.1624959945678711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,2,8,power_law_1.2,0.04744960069656372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,1,16,power_law_1.2,0.19548799991607665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,2,8,power_law_1.01,0.11965440511703491
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,2,8,power_law_1.2,0.05767679810523987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,1,16,power_law_1.2,0.2232896089553833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,2,8,power_law_1.01,0.13689600229263305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,2,8,power_law_1.2,0.06833919882774353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,1,16,power_law_1.2,0.2378688097000122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,2,8,power_law_1.01,0.1741696000099182
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,2,8,power_law_1.2,0.06977279782295227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,1,16,power_law_1.2,0.315283203125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,2,8,power_law_1.2,0.07775359749794006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,2,8,power_law_1.01,0.145907199382782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,1,16,power_law_1.2,0.3668800115585327
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,2,8,power_law_1.2,0.0937279999256134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,2,8,power_law_1.01,0.18481279611587526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,1,16,power_law_1.2,0.4973311901092529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,2,8,power_law_1.2,0.11113599538803101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,2,8,power_law_1.01,0.26061439514160156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,1,16,power_law_1.2,0.6189375877380371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,2,8,power_law_1.2,0.12750719785690307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,2,8,power_law_1.01,0.3345151901245117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,1,16,power_law_1.2,0.8801216125488281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,2,8,power_law_1.2,0.16232320070266723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,2,8,power_law_1.01,0.49324798583984375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,1,16,power_law_1.2,1.1420479774475099
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,2,8,power_law_1.2,0.11990400552749633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,2,8,power_law_1.01,0.6437695980072021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,1,16,power_law_1.2,1.33374080657959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,2,8,power_law_1.2,0.13754240274429322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,2,8,power_law_1.01,0.9563008308410644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,1,16,power_law_1.2,2.1259008407592774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,2,8,power_law_1.2,0.17503360509872437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,2,8,power_law_1.01,1.269222354888916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,2,8,power_law_1.2,0.1471743941307068
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,1,16,power_law_1.2,4.950713729858398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,2,8,power_law_1.01,1.8973503112792969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,2,8,power_law_1.2,0.18547840118408204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,2,8,power_law_1.2,0.26207358837127687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,2,8,power_law_1.01,2.5197376251220702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,2,8,power_law_1.2,0.3349695920944214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,2,8,power_law_1.01,3.1466304779052736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,2,8,power_law_1.2,0.49367680549621584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,2,8,power_law_1.01,0.08324480056762695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,2,8,power_law_1.01,5.019513702392578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,2,8,power_law_1.2,0.6450496196746827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,16,1,power_law_1.01,0.058719998598098753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,2,8,power_law_1.01,0.11027840375900269
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,16,1,power_law_1.01,0.06464639902114869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,2,8,power_law_1.2,0.9551103591918946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,2,8,power_law_1.01,0.07955200076103211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,2,8,power_law_1.01,10.017049407958984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,16,1,power_law_1.01,0.06690559983253479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,2,8,power_law_1.2,1.2684608459472657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,16,1,power_law_1.01,0.06176000237464905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,2,8,power_law_1.01,0.07996159791946411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,2,8,power_law_1.2,1.8937088012695313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,16,1,power_law_1.01,0.07489280104637146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,2,8,power_law_1.01,0.09549440145492553
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,16,1,power_law_1.01,0.08021119832992554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,2,8,power_law_1.2,2.524684715270996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,2,8,power_law_1.01,0.10618239641189575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,16,1,power_law_1.01,0.08901119828224183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,16,1,power_law_1.01,0.10273920297622681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,2,8,power_law_1.2,0.07831680178642272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,2,8,power_law_1.01,0.12870399951934813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,2,8,power_law_1.2,3.139295959472656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,16,1,power_law_1.01,0.11113599538803101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,2,8,power_law_1.2,0.11109119653701782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,2,8,power_law_1.01,0.12952959537506104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,2,8,power_law_1.2,5.0142463684082035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,16,1,power_law_1.01,0.13407360315322875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,2,8,power_law_1.2,0.07052800059318542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,2,8,power_law_1.01,0.130348801612854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,16,1,power_law_1.01,0.15619200468063354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,16,1,power_law_1.01,0.1998271942138672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,2,8,power_law_1.01,0.1360640048980713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,2,8,power_law_1.2,0.07831040024757385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,2,8,power_law_1.2,10.028569793701172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,16,1,power_law_1.01,0.2407680034637451
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,2,8,power_law_1.01,0.14017280340194702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,2,8,power_law_1.2,0.09756799936294555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,16,1,power_law_1.01,0.3370368003845215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,2,8,power_law_1.01,0.1422271966934204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,2,8,power_law_1.2,0.09919999837875366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,16,1,power_law_1.01,0.4232448101043701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,2,8,power_law_1.01,0.14714239835739135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,16,1,power_law_1.01,0.6124864101409913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,2,8,power_law_1.2,0.1254464030265808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,16,1,power_law_1.01,0.7834752082824707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,2,8,power_law_1.01,0.1438655972480774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,2,8,power_law_1.2,0.13075200319290162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,4,4,power_law_1.01,0.022457599639892578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,16,1,power_law_1.01,0.9723135948181152
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,2,8,power_law_1.01,0.1553279995918274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,2,8,power_law_1.2,0.13197439908981323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,4,4,power_law_1.01,0.02223999947309494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,16,1,power_law_1.01,1.5412480354309082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,2,8,power_law_1.01,0.16186879873275756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,4,4,power_law_1.01,0.024089600145816802
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,2,8,power_law_1.2,0.1344383955001831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,16,1,power_law_1.01,3.097932815551758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,2,8,power_law_1.01,0.17048319578170776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,4,4,power_law_1.01,0.026950401067733765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,2,8,power_law_1.2,0.13626879453659058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,2,8,power_law_1.01,0.18994560241699218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,4,4,power_law_1.01,0.03126400113105774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,2,8,power_law_1.2,0.1381183981895447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,2,8,power_law_1.01,0.20223360061645507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,4,4,power_law_1.01,0.04335359930992126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,2,8,power_law_1.2,0.14465919733047486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,2,8,power_law_1.01,0.2466752052307129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,4,4,power_law_1.2,0.020614400506019592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,4,4,power_law_1.01,0.05315840244293213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,2,8,power_law_1.2,0.14917759895324706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,4,4,power_law_1.2,0.021427200734615327
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,2,8,power_law_1.01,0.2569024085998535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,4,4,power_law_1.01,0.061766397953033444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,2,8,power_law_1.2,0.15285760164260864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,4,4,power_law_1.2,0.02245119959115982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,2,8,power_law_1.01,0.31547520160675047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,4,4,power_law_1.01,0.06914560198783874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,2,8,power_law_1.2,0.16269439458847046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,4,4,power_law_1.2,0.025740799307823182
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,2,8,power_law_1.01,0.37793920040130613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,4,4,power_law_1.01,0.07651839852333069
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,2,8,power_law_1.2,0.1692415952682495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,4,4,power_law_1.2,0.02861439883708954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,4,4,power_law_1.01,0.0933247983455658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,2,8,power_law_1.01,0.47725439071655273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,2,8,power_law_1.2,0.19749759435653685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,4,4,power_law_1.2,0.03433600068092346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,4,4,power_law_1.01,0.0949504017829895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,2,8,power_law_1.01,0.5907135963439941
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,2,8,power_law_1.2,0.2120512008666992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,4,4,power_law_1.2,0.041119998693466185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,4,4,power_law_1.01,0.10969599485397338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,2,8,power_law_1.2,0.25729920864105227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,2,8,power_law_1.01,0.8620863914489746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,4,4,power_law_1.2,0.04622719883918762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,4,4,power_law_1.01,0.13468159437179567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,2,8,power_law_1.2,0.26181759834289553
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,2,8,power_law_1.01,1.0124223709106446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,4,4,power_law_1.2,0.052774399518966675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,4,4,power_law_1.01,0.1023360013961792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,2,8,power_law_1.2,0.33390719890594484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,2,8,power_law_1.01,1.2591936111450195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,4,4,power_law_1.2,0.05768960118293762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,4,4,power_law_1.01,0.11891839504241944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,2,8,power_law_1.2,0.38163840770721436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,2,8,power_law_1.01,1.95797119140625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,4,4,power_law_1.2,0.06811519861221313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,4,4,power_law_1.01,0.14780160188674926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,2,8,power_law_1.2,0.4887231826782227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,4,4,power_law_1.2,0.070796799659729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,4,4,power_law_1.01,0.1379520058631897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,2,8,power_law_1.01,3.63570556640625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,2,8,power_law_1.2,0.6333119869232178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,4,4,power_law_1.2,0.07980160117149353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,4,4,power_law_1.01,0.17072639465332032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,2,8,power_law_1.2,0.9075519561767578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,4,4,power_law_1.2,0.09556480050086975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,4,4,power_law_1.01,0.23668479919433594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,4,4,power_law_1.2,0.07672960162162781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,4,4,power_law_1.01,0.2987391948699951
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,4,4,power_law_1.2,0.08675199747085571
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,4,4,power_law_1.01,0.42979841232299804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,4,4,power_law_1.2,0.10439039468765259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,4,4,power_law_1.01,0.08529279828071594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,4,4,power_law_1.01,0.5387519836425781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,4,4,power_law_1.2,0.09946879744529724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,4,4,power_law_1.01,0.09143679738044738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,4,4,power_law_1.01,0.8310079574584961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,4,4,power_law_1.2,0.12117760181427002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,4,4,power_law_1.01,0.07627519965171814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,4,4,power_law_1.01,1.0827072143554688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,4,4,power_law_1.2,0.1604864001274109
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,4,4,power_law_1.01,0.08713600039482117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,4,4,power_law_1.01,1.6055551528930665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,4,4,power_law_1.2,0.1922368049621582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,4,4,power_law_1.01,0.10700160264968872
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,4,4,power_law_1.01,2.152179145812988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,4,4,power_law_1.2,0.27946879863739016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,4,4,power_law_1.01,0.12338559627532959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,4,4,power_law_1.01,2.694655990600586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,4,4,power_law_1.2,0.3556544065475464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,4,4,power_law_1.01,0.15326720476150513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,4,4,power_law_1.01,4.228224182128907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,4,4,power_law_1.01,0.15736960172653197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,4,4,power_law_1.2,0.5195136070251465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,4,4,power_law_1.01,0.158188796043396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,4,4,power_law_1.2,0.6794559955596924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,4,4,power_law_1.01,8.692658996582031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,4,4,power_law_1.01,0.16146559715270997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,4,4,power_law_1.2,1.0087807655334473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,4,4,power_law_1.01,0.16885119676589966
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,4,4,power_law_1.2,1.3358464241027832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,4,4,power_law_1.01,0.17089279890060424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,4,4,power_law_1.2,1.6555328369140625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,4,4,power_law_1.01,0.18052480220794678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,4,4,power_law_1.2,2.6336511611938476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,4,4,power_law_1.2,0.08510720133781433
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,4,4,power_law_1.01,0.18154879808425903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,4,4,power_law_1.2,0.08902400135993957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,4,4,power_law_1.01,0.1876736044883728
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,4,4,power_law_1.2,5.226425552368164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,4,4,power_law_1.2,0.0728384017944336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,4,4,power_law_1.01,0.1929919958114624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,4,4,power_law_1.2,0.08511999845504761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,4,4,power_law_1.01,0.21308159828186035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,4,4,power_law_1.2,0.09535359740257263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,4,4,power_law_1.01,0.22537600994110107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,8,2,power_law_1.01,0.022047999501228332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,4,4,power_law_1.2,0.11665920019149781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,4,4,power_law_1.01,0.2519999980926514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,8,2,power_law_1.01,0.022035199403762817
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,4,4,power_law_1.2,0.14820480346679688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,4,4,power_law_1.01,0.29456639289855957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,8,2,power_law_1.01,0.02287999987602234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,4,4,power_law_1.2,0.15475840568542482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,4,4,power_law_1.01,0.32365438938140867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,8,2,power_law_1.01,0.026144000887870788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,4,4,power_law_1.2,0.1569983959197998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,4,4,power_law_1.01,0.3943295955657959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,8,2,power_law_1.01,0.03454720079898834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,4,4,power_law_1.2,0.16046080589294434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,4,4,power_law_1.01,0.46005759239196775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,8,2,power_law_1.01,0.03968639969825745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,4,4,power_law_1.2,0.16417920589447021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,8,2,power_law_1.01,0.04867199957370758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,4,4,power_law_1.01,0.5919551849365234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,4,4,power_law_1.2,0.16643199920654297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,8,2,power_law_1.01,0.05237119793891907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,4,4,power_law_1.01,0.7572544097900391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,4,4,power_law_1.2,0.17359360456466674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,8,2,power_law_1.01,0.06034560203552246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,4,4,power_law_1.01,1.000543975830078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,4,4,power_law_1.2,0.1854848027229309
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,8,2,power_law_1.01,0.06445440053939819
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,4,4,power_law_1.01,1.3218560218811035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,4,4,power_law_1.2,0.18977919816970826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,8,2,power_law_1.01,0.07611520290374756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,4,4,power_law_1.01,1.5391615867614745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,4,4,power_law_1.2,0.19775359630584716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,8,2,power_law_1.01,0.08676480054855347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,4,4,power_law_1.01,2.3755712509155273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,4,4,power_law_1.2,0.2120896100997925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,8,2,power_law_1.01,0.09741439819335937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,4,4,power_law_1.2,0.23463680744171142
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,8,2,power_law_1.01,0.1215872049331665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,4,4,power_law_1.01,4.690003204345703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,4,4,power_law_1.2,0.2622848033905029
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,8,2,power_law_1.01,0.09557759761810303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,4,4,power_law_1.2,0.29667201042175295
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,8,2,power_law_1.01,0.10766719579696656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,8,2,power_law_1.01,0.13551360368728638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,4,4,power_law_1.2,0.3228928089141846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,8,2,power_law_1.2,0.02221439927816391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,8,2,power_law_1.01,0.13059200048446656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,4,4,power_law_1.2,0.4091072082519531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,8,2,power_law_1.2,0.02487040013074875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,8,2,power_law_1.2,0.0271232008934021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,4,4,power_law_1.2,0.4695295810699463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,8,2,power_law_1.2,0.03450239896774292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,4,4,power_law_1.2,0.64170241355896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,8,2,power_law_1.2,0.05252479910850525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,4,4,power_law_1.2,0.7515520095825196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,8,2,power_law_1.2,0.0584447979927063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,4,4,power_law_1.2,1.069983959197998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,8,2,power_law_1.2,0.07628160119056701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,4,4,power_law_1.2,1.379263973236084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,8,2,power_law_1.2,0.08140159845352173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,4,4,power_law_1.2,1.6051456451416015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,8,2,power_law_1.2,0.08672639727592468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,8,2,power_law_1.2,0.09143679738044738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,4,4,power_law_1.2,2.6344064712524413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,8,2,power_law_1.2,0.10351999998092651
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,4,4,power_law_1.2,5.191199874877929
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,8,2,power_law_1.2,0.11068799495697021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,8,2,power_law_1.2,0.11887999773025512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,8,2,power_law_1.2,0.13772159814834595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,8,2,power_law_1.2,0.1254271984100342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,8,2,power_law_1.2,0.13299200534820557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,8,2,power_law_1.2,0.15450880527496338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,8,2,power_law_1.2,0.15635199546813966
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,8,2,power_law_1.01,0.08267520070075988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,8,2,power_law_1.2,0.18217600584030152
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,8,2,power_law_1.01,0.0886080026626587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,8,2,power_law_1.2,0.20837759971618652
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,8,2,power_law_1.01,0.0933184027671814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,8,2,power_law_1.01,0.10047999620437623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,8,2,power_law_1.2,0.24747519493103026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,8,2,power_law_1.01,0.13304959535598754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,8,2,power_law_1.2,0.3142591953277588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,8,2,power_law_1.01,0.1588544011116028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,8,2,power_law_1.2,0.4039423942565918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,8,2,power_law_1.01,0.19610879421234131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,8,2,power_law_1.2,0.5538688182830811
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,8,2,power_law_1.01,0.20145280361175538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,8,2,power_law_1.2,0.7068416118621826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,8,2,power_law_1.01,0.21189119815826415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,8,2,power_law_1.2,0.9845696449279785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,8,2,power_law_1.01,0.21434879302978516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,8,2,power_law_1.2,1.2984383583068848
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,8,2,power_law_1.01,0.22232320308685302
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,8,2,power_law_1.2,1.6804607391357422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,8,2,power_law_1.01,0.2264319896697998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,8,2,power_law_1.2,2.591001510620117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,8,2,power_law_1.01,0.2391103982925415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,8,2,power_law_1.01,0.24732160568237305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,8,2,power_law_1.2,5.067033767700195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,8,2,power_law_1.01,0.26248319149017335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,8,2,power_law_1.01,0.2637887954711914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,8,2,power_law_1.01,0.2854079961776733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,8,2,power_law_1.01,0.3009727954864502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,8,2,power_law_1.01,0.3478143930435181
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,8,2,power_law_1.01,0.4089216232299805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,8,2,power_law_1.2,0.07996799945831298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,8,2,power_law_1.01,0.43471360206604004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,8,2,power_law_1.2,0.0902079999446869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,8,2,power_law_1.01,0.5567808151245117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,8,2,power_law_1.2,0.09184640049934387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,8,2,power_law_1.01,0.6284671783447265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,8,2,power_law_1.2,0.10229120254516602
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,8,2,power_law_1.01,0.8527104377746582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,8,2,power_law_1.2,0.12215039730072022
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,8,2,power_law_1.01,1.0177663803100585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,8,2,power_law_1.2,0.15164799690246583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,8,2,power_law_1.01,1.433664035797119
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,8,2,power_law_1.2,0.19096319675445556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,8,2,power_law_1.01,1.8038015365600586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,8,2,power_law_1.2,0.19916160106658937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,8,2,power_law_1.01,2.1976320266723635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,8,2,power_law_1.2,0.20734720230102538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,8,2,power_law_1.01,3.4094337463378905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,8,2,power_law_1.2,0.2243328094482422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,8,2,power_law_1.2,0.225164794921875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,8,2,power_law_1.01,6.789453125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,8,2,power_law_1.2,0.23294079303741455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,8,2,power_law_1.2,0.23840639591217042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,8,2,power_law_1.2,0.24666879177093506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,16,1,power_law_1.01,0.021222400665283202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,8,2,power_law_1.2,0.25895678997039795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,16,1,power_law_1.01,0.02162559926509857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,8,2,power_law_1.2,0.2808768033981323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,16,1,power_law_1.01,0.023270399868488313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,8,2,power_law_1.2,0.2925503969192505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,16,1,power_law_1.01,0.027379199862480164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,8,2,power_law_1.2,0.3263488054275513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,16,1,power_law_1.01,0.046009600162506104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,8,2,power_law_1.2,0.35514240264892577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,16,1,power_law_1.01,0.04989440143108368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,8,2,power_law_1.2,0.43795199394226075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,16,1,power_law_1.01,0.055225598812103274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,8,2,power_law_1.2,0.4645120143890381
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,16,1,power_law_1.01,0.06218240261077881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,8,2,power_law_1.2,0.5596223831176758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,16,1,power_law_1.01,0.06793599724769592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,8,2,power_law_1.2,0.6441855907440186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,16,1,power_law_1.01,0.0720255970954895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,8,2,power_law_1.2,0.8682175636291504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,16,1,power_law_1.01,0.07879679799079894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,8,2,power_law_1.2,1.0650495529174804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,16,1,power_law_1.01,0.09147520065307617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,8,2,power_law_1.2,1.4427007675170898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,16,1,power_law_1.01,0.09902719855308532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,8,2,power_law_1.2,1.9215167999267577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,16,1,power_law_1.01,0.11789439916610718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,8,2,power_law_1.2,2.2151935577392576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,16,1,power_law_1.01,0.10089600086212158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,2,8,power_law_1.2,1.1551551818847656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,16,1,power_law_1.01,0.11052800416946411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,8,2,power_law_1.2,3.390150451660156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,2,8,power_law_1.2,1.421388816833496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,16,1,power_law_1.01,0.13224320411682128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,2,8,power_law_1.2,2.1291776657104493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,16,1,power_law_1.01,0.13264000415802002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,8,2,power_law_1.2,7.544710540771485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,16,1,power_law_1.01,0.1608896017074585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,2,8,power_law_1.2,4.441363143920898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,16,1,power_law_1.01,0.17552000284194946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,16,1,power_law_1.01,0.21166720390319824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,16,1,power_law_1.2,0.02220800071954727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,16,1,power_law_1.01,0.2905280113220215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,16,1,power_law_1.2,0.02364159971475601
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,16,1,power_law_1.01,0.36017279624938964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,16,1,power_law_1.2,0.025900799036026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,16,1,power_law_1.01,0.5203199863433838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,16,1,power_law_1.2,0.034092798829078674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,16,1,power_law_1.01,0.6663360118865966
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,16,1,power_law_1.2,0.05777279734611511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,16,1,power_law_1.2,0.07217919826507568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,16,1,power_law_1.01,0.9719039916992187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,16,1,power_law_1.2,0.08568320274353028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,16,1,power_law_1.01,1.2797311782836913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,16,1,power_law_1.2,0.09468160271644592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,16,1,power_law_1.01,1.5785216331481933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,16,1,power_law_1.01,0.0959231972694397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,16,1,power_law_1.2,0.09983360171318054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,16,1,power_law_1.01,0.10330239534378052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,16,1,power_law_1.01,2.491526412963867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,16,1,power_law_1.2,0.10249600410461426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,16,1,power_law_1.01,0.11518720388412476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,16,1,power_law_1.2,0.1172287940979004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,16,1,power_law_1.01,4.913075256347656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,16,1,power_law_1.01,0.14528640508651733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,16,1,power_law_1.2,0.1220736026763916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,16,1,power_law_1.2,0.13607679605484008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,16,1,power_law_1.01,0.18276480436325074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,16,1,power_law_1.2,0.1540735960006714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,16,1,power_law_1.01,0.22721281051635742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,16,1,power_law_1.2,0.1407807946205139
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,16,1,power_law_1.01,0.3027712106704712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,16,1,power_law_1.2,0.15409280061721803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,16,1,power_law_1.01,0.32284159660339357
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,16,1,power_law_1.2,0.1733440041542053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,16,1,power_law_1.01,0.3396415948867798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,16,1,power_law_1.2,0.18644479513168336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,16,1,power_law_1.01,0.34209280014038085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,16,1,power_law_1.2,0.2091968059539795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,16,1,power_law_1.01,0.3502784013748169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,16,1,power_law_1.2,0.23602559566497802
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,16,1,power_law_1.2,0.0949504017829895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,16,1,power_law_1.01,0.37445759773254395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,16,1,power_law_1.2,0.27716479301452634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,16,1,power_law_1.2,0.10212479829788208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,16,1,power_law_1.01,0.367903995513916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,16,1,power_law_1.2,0.34866559505462646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,16,1,power_law_1.2,0.11093120574951172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,16,1,power_law_1.01,0.39370880126953123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,16,1,power_law_1.2,0.4266751766204834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,16,1,power_law_1.2,0.13919999599456787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,16,1,power_law_1.01,0.3945280075073242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,16,1,power_law_1.2,0.17237119674682616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,16,1,power_law_1.2,0.5854015827178956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,16,1,power_law_1.01,0.42626562118530276
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,16,1,power_law_1.2,0.21496319770812988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,16,1,power_law_1.2,0.7318272113800048
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,16,1,power_law_1.01,0.44573440551757815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,16,1,power_law_1.2,0.2985152006149292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,16,1,power_law_1.2,1.0304320335388184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,16,1,power_law_1.01,0.5149504184722901
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,16,1,power_law_1.2,0.3069119930267334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,16,1,power_law_1.01,0.5591807842254639
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,16,1,power_law_1.2,1.3447744369506835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,16,1,power_law_1.2,0.33578879833221437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,16,1,power_law_1.01,0.6744895935058594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,16,1,power_law_1.2,1.6423744201660155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,16,1,power_law_1.2,0.33231360912323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,16,1,power_law_1.01,0.7305920124053955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,16,1,power_law_1.2,2.5496063232421875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,16,1,power_law_1.2,0.3583296060562134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,16,1,power_law_1.01,0.9280192375183105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,16,1,power_law_1.2,0.3726655960083008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,16,1,power_law_1.2,4.9798015594482425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,16,1,power_law_1.01,1.0552063941955567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,16,1,power_law_1.2,0.3827008008956909
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,16,1,power_law_1.01,1.4094847679138183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,16,1,power_law_1.2,0.38453121185302735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,16,1,power_law_1.01,1.735763168334961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,8,2,power_law_1.01,0.16376960277557373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,16,1,power_law_1.2,0.41751680374145506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,16,1,power_law_1.01,2.42224006652832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,8,2,power_law_1.01,0.17441920042037964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,16,1,power_law_1.2,0.4269248008728027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,8,2,power_law_1.01,0.22480640411376954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,16,1,power_law_1.2,0.46788477897644043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,1,16,power_law_1.01,0.028358399868011475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,16,1,power_law_1.01,3.131059265136719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,1,16,power_law_1.01,0.020979200303554536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,8,2,power_law_1.01,0.3196223974227905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,16,1,power_law_1.2,0.5256576061248779
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,16,1,power_law_1.01,3.829011154174805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,1,16,power_law_1.01,0.022201600670814513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,8,2,power_law_1.01,0.4126016139984131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,16,1,power_law_1.2,0.5780735969543457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,1,16,power_law_1.01,0.025484800338745117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,16,1,power_law_1.01,5.816608047485351
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,8,2,power_law_1.01,0.5850368022918702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,16,1,power_law_1.2,0.6720831871032715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,1,16,power_law_1.01,0.02999039888381958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,16,1,power_law_1.2,0.740883207321167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,8,2,power_law_1.01,0.7646463871002197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,1,16,power_law_1.01,0.036959999799728395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,16,1,power_law_1.01,11.349260711669922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,16,1,power_law_1.2,0.9354432106018067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,1,16,power_law_1.01,0.0406464010477066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,8,2,power_law_1.01,1.125708770751953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,1,16,power_law_1.01,0.039001598954200745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,16,1,power_law_1.2,1.065497589111328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,8,2,power_law_1.01,1.5150336265563964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,1,16,power_law_1.01,0.04330880045890808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,16,1,power_law_1.2,1.409984016418457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,8,2,power_law_1.01,1.8742528915405274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,1,16,power_law_1.01,0.047200000286102294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,16,1,power_law_1.2,1.741548728942871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,1,16,power_law_1.01,0.0578495979309082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,8,2,power_law_1.01,2.9738239288330077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,1,16,power_law_1.2,0.02791680097579956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,16,1,power_law_1.2,2.415763282775879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,1,16,power_law_1.01,0.04597119987010956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,1,16,power_law_1.2,0.02178560048341751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,1,16,power_law_1.01,0.051500797271728516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,16,1,power_law_1.2,3.1323328018188477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,8,2,power_law_1.01,5.783468627929688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,1,16,power_law_1.2,0.022809599339962006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,1,16,power_law_1.01,0.05866879820823669
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,16,1,power_law_1.2,3.845452880859375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,1,16,power_law_1.2,0.022617599368095397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,1,16,power_law_1.01,0.04822399914264679
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,1,16,power_law_1.2,0.028352001309394838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,1,16,power_law_1.01,0.05455999970436096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,16,1,power_law_1.2,5.833049774169922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,1,16,power_law_1.01,0.07775999903678894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,1,16,power_law_1.2,0.03326080143451691
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,1,16,power_law_1.01,0.06501759886741638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,1,16,power_law_1.01,0.05112959742546082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,1,16,power_law_1.2,0.038176000118255615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,1,16,power_law_1.01,0.08324480056762695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,16,1,power_law_1.2,11.426739501953126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,1,16,power_law_1.01,0.03966079950332642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,1,16,power_law_1.2,0.04023039937019348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,1,16,power_law_1.01,0.10042879581451417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,1,16,power_law_1.01,0.041305598616600034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,1,16,power_law_1.01,0.12768640518188476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,1,16,power_law_1.2,0.04350079894065857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,1,16,power_law_1.01,0.04439040124416351
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,1,16,power_law_1.01,0.16593919992446898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,1,16,power_law_1.2,0.04739840030670166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,1,16,power_law_1.01,0.05235840082168579
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,1,16,power_law_1.2,0.08591359853744507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,1,16,power_law_1.01,0.22126080989837646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,1,16,power_law_1.2,0.05804160237312317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,1,16,power_law_1.01,0.05256320238113403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,1,16,power_law_1.2,0.04169600009918213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,1,16,power_law_1.01,0.3171072006225586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,1,16,power_law_1.01,0.05441280007362366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,1,16,power_law_1.2,0.04801279902458191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,1,16,power_law_1.2,0.04129279851913452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,1,16,power_law_1.01,0.47235841751098634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,1,16,power_law_1.01,0.051123201847076416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,1,16,power_law_1.2,0.04498560130596161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,1,16,power_law_1.2,0.050457602739334105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,1,16,power_law_1.2,0.044972801208496095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,1,16,power_law_1.01,0.5898880004882813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,1,16,power_law_1.2,0.05988479852676391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,1,16,power_law_1.2,0.05358719825744629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,1,16,power_law_1.2,0.051283198595047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,1,16,power_law_1.01,0.9264063835144043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,1,16,power_law_1.2,0.055225598812103274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,1,16,power_law_1.2,0.05619840025901794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,1,16,power_law_1.01,1.1543359756469727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,1,16,power_law_1.2,0.05440000295639038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,1,16,power_law_1.2,0.06520320177078247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,1,16,power_law_1.01,1.4789376258850098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,1,16,power_law_1.2,0.055641597509384154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,1,16,power_law_1.2,0.08486400246620178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,1,16,power_law_1.01,2.3563072204589846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,1,16,power_law_1.2,0.05500159859657287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,1,16,power_law_1.2,0.10862079858779908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,1,16,power_law_1.2,0.0531711995601654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,1,16,power_law_1.2,0.1508095979690552
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,1,16,power_law_1.01,5.058438491821289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,1,16,power_law_1.2,0.05563520193099976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,1,16,power_law_1.2,0.19997440576553344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,1,16,power_law_1.2,0.058911997079849246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,1,16,power_law_1.2,0.2757440090179443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,1,16,power_law_1.2,0.061766397953033444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,1,16,power_law_1.2,0.3633984088897705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,1,16,power_law_1.2,0.06813439726829529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,1,16,power_law_1.2,0.546073579788208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,2,8,power_law_1.01,0.023443199694156647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,1,16,power_law_1.2,0.0720255970954895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,1,16,power_law_1.2,0.7412415981292725
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,2,8,power_law_1.01,0.021382400393486024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,1,16,power_law_1.2,0.07795199751853943
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,2,8,power_law_1.01,0.023852799832820893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,1,16,power_law_1.2,0.9329536437988282
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,1,16,power_law_1.2,0.0896127998828888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,2,8,power_law_1.01,0.025491198897361754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,1,16,power_law_1.2,1.4904000282287597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,1,16,power_law_1.2,0.09598079919815064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,2,8,power_law_1.01,0.029177600145339967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,1,16,power_law_1.2,0.11727360486984253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,1,16,power_law_1.2,1.8426559448242188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,2,8,power_law_1.01,0.0406464010477066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,1,16,power_law_1.2,0.12750719785690307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,2,8,power_law_1.01,0.036748799681663516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,1,16,power_law_1.2,3.0212799072265626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,1,16,power_law_1.2,0.15700479745864868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,2,8,power_law_1.01,0.040633600950241086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,1,16,power_law_1.2,0.20965120792388917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,1,16,power_law_1.2,6.466835021972656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,2,8,power_law_1.01,0.046374401450157164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,1,16,power_law_1.2,0.26575360298156736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,2,8,power_law_1.01,0.04842880070209503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,1,16,power_law_1.2,0.3194240093231201
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,2,8,power_law_1.01,0.050470399856567386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,2,8,power_law_1.01,0.050470399856567386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,1,16,power_law_1.2,0.49205760955810546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,2,8,power_law_1.01,0.053548800945281985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,1,16,power_law_1.2,0.7101696014404297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,2,8,power_law_1.2,0.02261119931936264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,2,8,power_law_1.01,0.05129600167274475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,2,8,power_law_1.2,0.02056960016489029
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,1,16,power_law_1.2,1.0198335647583008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,2,8,power_law_1.01,0.05416319966316223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,2,8,power_law_1.2,0.022195200622081756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,1,16,power_law_1.2,1.5215999603271484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,2,8,power_law_1.01,0.06030719876289368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,2,8,power_law_1.2,0.024038399755954742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,2,8,power_law_1.01,0.05682560205459595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,2,8,power_law_1.2,0.032025599479675294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,1,16,power_law_1.2,3.2943294525146483
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,2,8,power_law_1.01,0.07075200080871583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,2,8,power_law_1.2,0.040627199411392215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,2,8,power_law_1.01,0.08610560297966004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,2,8,power_law_1.2,0.03653120100498199
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,2,8,power_law_1.01,0.10536320209503174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,2,8,power_law_1.2,0.040633600950241086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,2,8,power_law_1.01,0.055219197273254396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,2,8,power_law_1.01,0.12951680421829223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,2,8,power_law_1.2,0.0455487996339798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,2,8,power_law_1.01,0.040479999780654904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,2,8,power_law_1.01,0.1809280037879944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,2,8,power_law_1.2,0.04800640046596527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,2,8,power_law_1.01,0.043347200751304625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,2,8,power_law_1.01,0.24174079895019532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,2,8,power_law_1.2,0.05087360143661499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,2,8,power_law_1.01,0.04539520144462585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,2,8,power_law_1.01,0.36135039329528806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,2,8,power_law_1.2,0.048819199204444885
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,2,8,power_law_1.01,0.049491199851036075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,2,8,power_law_1.01,0.45720958709716797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,2,8,power_law_1.2,0.0541375994682312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,2,8,power_law_1.01,0.05809280276298523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,2,8,power_law_1.01,0.6474688053131104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,2,8,power_law_1.2,0.05251839756965637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,2,8,power_law_1.01,0.05686399936676025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,2,8,power_law_1.2,0.055795198678970336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,2,8,power_law_1.01,0.060134398937225345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,2,8,power_law_1.01,0.8489919662475586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,2,8,power_law_1.01,0.060127997398376466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,2,8,power_law_1.2,0.06110720038414001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,2,8,power_law_1.01,1.0842944145202638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,2,8,power_law_1.01,0.05973759889602661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,2,8,power_law_1.2,0.05865600109100342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,2,8,power_law_1.01,1.7238784790039063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,2,8,power_law_1.01,0.06219519972801209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,2,8,power_law_1.2,0.07340160012245178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,2,8,power_law_1.01,0.06259840130805969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,2,8,power_law_1.2,0.08609920144081115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,2,8,power_law_1.01,3.0843072891235352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,2,8,power_law_1.01,0.0652671992778778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,2,8,power_law_1.2,0.11189759969711303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,2,8,power_law_1.01,0.06710399985313416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,2,8,power_law_1.2,0.1438591957092285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,2,8,power_law_1.01,0.07366399765014649
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,2,8,power_law_1.2,0.19505280256271362
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,2,8,power_law_1.2,0.05619840025901794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,2,8,power_law_1.01,0.07406719923019409
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,2,8,power_law_1.2,0.24707839488983155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,2,8,power_law_1.2,0.041868799924850465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,2,8,power_law_1.01,0.08021759986877441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,2,8,power_law_1.2,0.36338560581207274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,2,8,power_law_1.2,0.0430976003408432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,2,8,power_law_1.01,0.0937279999256134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,2,8,power_law_1.2,0.4768511772155762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,2,8,power_law_1.2,0.04700160026550293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,2,8,power_law_1.01,0.10130560398101807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,2,8,power_law_1.2,0.047814399003982544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,2,8,power_law_1.2,0.6818624019622803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,2,8,power_law_1.01,0.11912319660186768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,2,8,power_law_1.2,0.05989120006561279
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,2,8,power_law_1.2,0.9943807601928711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,2,8,power_law_1.01,0.12814079523086547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,2,8,power_law_1.2,0.0590719997882843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,2,8,power_law_1.2,1.1956928253173829
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,2,8,power_law_1.01,0.17032320499420167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,2,8,power_law_1.2,0.06151679754257202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,2,8,power_law_1.01,0.19572479724884034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,2,8,power_law_1.2,0.06112639904022217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,2,8,power_law_1.2,1.9788543701171875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,2,8,power_law_1.01,0.25674240589141845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,2,8,power_law_1.2,0.061536002159118655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,2,8,power_law_1.2,4.307212829589844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,2,8,power_law_1.2,0.06213120222091675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,2,8,power_law_1.01,0.32836480140686036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,2,8,power_law_1.2,0.06481279730796814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,2,8,power_law_1.01,0.46010241508483884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,2,8,power_law_1.2,0.06787840127944947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,2,8,power_law_1.01,0.6292672157287598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,2,8,power_law_1.2,0.06849279999732971
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,2,8,power_law_1.01,0.701151990890503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,4,4,power_law_1.01,0.019942399859428406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,2,8,power_law_1.2,0.07505919933319091
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,2,8,power_law_1.01,1.0888511657714843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,4,4,power_law_1.01,0.01932799965143204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,2,8,power_law_1.2,0.07585279941558838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,4,4,power_law_1.01,0.020761600136756896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,2,8,power_law_1.2,0.08343039751052857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,2,8,power_law_1.01,2.3116992950439452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,2,8,power_law_1.2,0.09610880017280579
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,4,4,power_law_1.01,0.02240640074014664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,2,8,power_law_1.2,0.1080064058303833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,4,4,power_law_1.01,0.025472000241279602
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,2,8,power_law_1.2,0.12602880001068115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,4,4,power_law_1.01,0.032441601157188416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,2,8,power_law_1.2,0.13854080438613892
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,4,4,power_law_1.01,0.03449600040912628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,4,4,power_law_1.2,0.01897599995136261
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,2,8,power_law_1.2,0.19301120042800904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,4,4,power_law_1.01,0.03592959940433502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,4,4,power_law_1.2,0.018969599902629853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,2,8,power_law_1.2,0.21759359836578368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,4,4,power_law_1.01,0.04145280122756958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,4,4,power_law_1.2,0.020403200387954713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,2,8,power_law_1.2,0.27778561115264894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,4,4,power_law_1.2,0.022041599452495574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,4,4,power_law_1.01,0.04371840059757233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,4,4,power_law_1.2,0.024294400215148927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,4,4,power_law_1.01,0.04999679923057556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,2,8,power_law_1.2,0.362988805770874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,4,4,power_law_1.2,0.0324864000082016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,4,4,power_law_1.01,0.044940799474716187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,2,8,power_law_1.2,0.5104447841644287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,4,4,power_law_1.2,0.034745600819587705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,4,4,power_law_1.01,0.04780159890651703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,2,8,power_law_1.2,0.7666431903839112
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,4,4,power_law_1.2,0.0367935985326767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,4,4,power_law_1.01,0.05538560152053833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,2,8,power_law_1.2,0.960812759399414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,4,4,power_law_1.2,0.04251520037651062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,4,4,power_law_1.01,0.0529151976108551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,2,8,power_law_1.2,1.676780891418457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,4,4,power_law_1.2,0.04434559941291809
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,4,4,power_law_1.01,0.05456640124320984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,4,4,power_law_1.2,0.05051519870758057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,4,4,power_law_1.01,0.06520959734916687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,2,8,power_law_1.2,2.984012794494629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,4,4,power_law_1.2,0.04581120014190674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,4,4,power_law_1.01,0.06766080260276794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,4,4,power_law_1.2,0.04867840111255646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,4,4,power_law_1.01,0.07954559922218322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,4,4,power_law_1.2,0.05603839755058289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,4,4,power_law_1.01,0.10042879581451417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,4,4,power_law_1.2,0.051948797702789304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,4,4,power_law_1.01,0.05497599840164184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,4,4,power_law_1.01,0.12583039999008178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,4,4,power_law_1.2,0.055027198791503903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,4,4,power_law_1.01,0.04657920002937317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,4,4,power_law_1.01,0.1590016007423401
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,4,4,power_law_1.2,0.06465280055999756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,4,4,power_law_1.01,0.047200000286102294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,4,4,power_law_1.01,0.20405120849609376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,4,4,power_law_1.2,0.06792320013046264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,4,4,power_law_1.01,0.05252479910850525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,4,4,power_law_1.01,0.3052351951599121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,4,4,power_law_1.2,0.0806335985660553
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,4,4,power_law_1.01,0.059487998485565186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,4,4,power_law_1.01,0.3812031984329224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,4,4,power_law_1.2,0.10232959985733033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,4,4,power_law_1.01,0.06664320230484008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,4,4,power_law_1.01,0.5477248191833496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,4,4,power_law_1.2,0.12609280347824098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,4,4,power_law_1.01,0.07258880138397217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,4,4,power_law_1.01,0.758457612991333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,4,4,power_law_1.01,0.07218559980392455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,4,4,power_law_1.2,0.17032959461212158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,4,4,power_law_1.01,0.07463679909706115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,4,4,power_law_1.2,0.21477758884429932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,4,4,power_law_1.01,0.9550656318664551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,4,4,power_law_1.01,0.07423359751701356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,4,4,power_law_1.2,0.30919039249420166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,4,4,power_law_1.01,1.4693120002746582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,4,4,power_law_1.01,0.07340800166130065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,4,4,power_law_1.2,0.3902719974517822
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,4,4,power_law_1.01,0.07628160119056701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,4,4,power_law_1.01,2.661446380615234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,4,4,power_law_1.2,0.6194176197052002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,4,4,power_law_1.01,0.07955200076103211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,4,4,power_law_1.2,0.7548031806945801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,4,4,power_law_1.01,0.08611199855804444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,4,4,power_law_1.2,0.9813247680664062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,4,4,power_law_1.01,0.09367039799690247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,4,4,power_law_1.01,0.09594240188598632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,4,4,power_law_1.2,1.6174335479736328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,4,4,power_law_1.2,0.05454720258712768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,4,4,power_law_1.01,0.10350719690322877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,4,4,power_law_1.2,0.043507200479507444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,4,4,power_law_1.2,3.240275192260742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,4,4,power_law_1.01,0.11784319877624512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,4,4,power_law_1.2,0.04534400105476379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,4,4,power_law_1.01,0.12910079956054688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,4,4,power_law_1.2,0.04984320104122162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,4,4,power_law_1.01,0.15123200416564941
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,4,4,power_law_1.2,0.05395200252532959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,4,4,power_law_1.01,0.16209280490875244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,4,4,power_law_1.2,0.06909440159797668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,1,16,power_law_1.01,0.021433599293231964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,4,4,power_law_1.01,0.2134783983230591
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,4,4,power_law_1.2,0.07074559926986694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,1,16,power_law_1.01,0.021427200734615327
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,4,4,power_law_1.01,0.24790399074554442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,4,4,power_law_1.2,0.07482240200042725
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,1,16,power_law_1.01,0.021222400665283202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,4,4,power_law_1.01,0.3617664098739624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,4,4,power_law_1.2,0.07401599884033203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,1,16,power_law_1.01,0.02101760059595108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,4,4,power_law_1.01,0.4236032009124756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,4,4,power_law_1.2,0.07648000121116638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,1,16,power_law_1.01,0.023270399868488313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,4,4,power_law_1.01,0.6392640113830567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,4,4,power_law_1.2,0.07585279941558838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,1,16,power_law_1.01,0.030239999294281006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,4,4,power_law_1.01,0.8387455940246582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,4,4,power_law_1.2,0.07749760150909424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,1,16,power_law_1.01,0.035769599676132205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,4,4,power_law_1.01,0.9538368225097656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,4,4,power_law_1.2,0.07852799892425537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,1,16,power_law_1.01,0.041715198755264284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,4,4,power_law_1.01,1.513753604888916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,4,4,power_law_1.2,0.08240640163421631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,1,16,power_law_1.01,0.04784640073776245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,4,4,power_law_1.2,0.09245439767837524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,1,16,power_law_1.01,0.05278080105781555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,4,4,power_law_1.01,3.1750911712646483
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,4,4,power_law_1.2,0.09694079756736755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,1,16,power_law_1.01,0.06381440162658691
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,1,16,power_law_1.01,0.05297920107841492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,4,4,power_law_1.2,0.10103679895401001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,1,16,power_law_1.01,0.07528960108757018
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,1,16,power_law_1.01,0.05092480182647705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,1,16,power_law_1.01,0.055212801694869994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,4,4,power_law_1.2,0.11883519887924195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,1,16,power_law_1.01,0.05440000295639038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,1,16,power_law_1.01,0.0666815996170044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,4,4,power_law_1.2,0.12910079956054688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,1,16,power_law_1.01,0.05398399829864502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,1,16,power_law_1.01,0.07896959781646729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,4,4,power_law_1.2,0.1647487998008728
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,1,16,power_law_1.01,0.061375999450683595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,1,16,power_law_1.01,0.0593280017375946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,4,4,power_law_1.2,0.17375359535217286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,1,16,power_law_1.01,0.06588159799575806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,1,16,power_law_1.01,0.07119359970092773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,1,16,power_law_1.01,0.06750079989433289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,4,4,power_law_1.2,0.21738240718841553
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,1,16,power_law_1.01,0.08552320003509521
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,4,4,power_law_1.2,0.2729023933410645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,1,16,power_law_1.2,0.055379199981689456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,1,16,power_law_1.01,0.10498559474945068
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,4,4,power_law_1.2,0.3756864070892334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,1,16,power_law_1.2,0.034297600388526917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,1,16,power_law_1.01,0.1486143946647644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,1,16,power_law_1.2,0.04105600118637085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,4,4,power_law_1.2,0.44408321380615234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,1,16,power_law_1.01,0.18916480541229247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,1,16,power_law_1.2,0.04597119987010956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,4,4,power_law_1.2,0.6437695980072021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,1,16,power_law_1.2,0.050886398553848265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,1,16,power_law_1.01,0.2725183963775635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,4,4,power_law_1.2,0.9316927909851074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,1,16,power_law_1.2,0.06317440271377564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,1,16,power_law_1.01,0.35831680297851565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,4,4,power_law_1.2,1.149824047088623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,1,16,power_law_1.2,0.06869760155677795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,1,16,power_law_1.01,0.5276927947998047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,4,4,power_law_1.2,1.7271551132202148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,1,16,power_law_1.2,0.0787392020225525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,1,16,power_law_1.01,0.6958335876464844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,1,16,power_law_1.2,0.08631680011749268
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,1,16,power_law_1.01,1.03373441696167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,4,4,power_law_1.2,3.8671039581298827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,1,16,power_law_1.2,0.09593600034713745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,1,16,power_law_1.01,1.3681920051574707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,1,16,power_law_1.2,0.11354880332946778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,1,16,power_law_1.01,1.707526397705078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,1,16,power_law_1.2,0.13935999870300292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,1,16,power_law_1.2,0.1045375943183899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,1,16,power_law_1.01,2.709849548339844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,1,16,power_law_1.01,0.101254403591156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,1,16,power_law_1.2,0.12439680099487305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,1,16,power_law_1.01,0.10350719690322877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,1,16,power_law_1.01,5.395782470703125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,1,16,power_law_1.2,0.1522752046585083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,1,16,power_law_1.01,0.0717631995677948
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,1,16,power_law_1.2,0.11273599863052368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,1,16,power_law_1.01,0.08057600259780884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,1,16,power_law_1.2,0.13054720163345337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,1,16,power_law_1.01,0.08405759930610657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,1,16,power_law_1.2,0.1823232054710388
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,1,16,power_law_1.01,0.10207359790802002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,1,16,power_law_1.2,0.2380608081817627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,1,16,power_law_1.2,0.17893120050430297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,1,16,power_law_1.2,0.07160959839820862
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,1,16,power_law_1.2,0.3226560115814209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,1,16,power_law_1.01,0.10412160158157349
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,1,16,power_law_1.2,0.07570559978485107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,1,16,power_law_1.2,0.43384318351745604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,1,16,power_law_1.01,0.10576000213623046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,1,16,power_law_1.2,0.08451200127601624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,1,16,power_law_1.2,0.6169600009918212
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,1,16,power_law_1.01,0.10801279544830322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,1,16,power_law_1.2,0.08021119832992554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,1,16,power_law_1.2,0.791648006439209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,1,16,power_law_1.01,0.10739200115203858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,1,16,power_law_1.2,0.10291839838027954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,1,16,power_law_1.01,0.1086016058921814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,1,16,power_law_1.2,1.1752256393432616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,1,16,power_law_1.2,0.10376960039138794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,1,16,power_law_1.01,0.10985599756240845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,1,16,power_law_1.2,1.543673610687256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,1,16,power_law_1.2,0.10683519840240478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,1,16,power_law_1.01,0.11128959655761719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,1,16,power_law_1.2,2.526495933532715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,1,16,power_law_1.2,0.1051967978477478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,1,16,power_law_1.01,0.11559040546417236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,1,16,power_law_1.2,3.2140033721923826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,1,16,power_law_1.2,0.10765440464019775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,1,16,power_law_1.01,0.12050559520721435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,1,16,power_law_1.2,4.07088623046875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,1,16,power_law_1.2,0.10887680053710938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,1,16,power_law_1.01,0.12604160308837892
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,1,16,power_law_1.2,0.11153919696807861
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,1,16,power_law_1.01,0.13074560165405275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,1,16,power_law_1.2,6.9147392272949215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,1,16,power_law_1.2,0.11173759698867798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,1,16,power_law_1.01,0.1475391983985901
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,1,16,power_law_1.2,0.11912959814071655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,1,16,power_law_1.01,0.16187520027160646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,1,16,power_law_1.2,15.109613037109375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,1,16,power_law_1.2,0.12199679613113404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,1,16,power_law_1.01,0.20364160537719728
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,1,16,power_law_1.2,0.12730239629745482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,1,16,power_law_1.01,0.2052992105484009
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,1,16,power_law_1.2,0.14165120124816893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,1,16,power_law_1.01,0.25588479042053225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,1,16,power_law_1.2,0.15741440057754516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,1,16,power_law_1.01,0.31587839126586914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,2,8,power_law_1.01,0.0361407995223999
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,1,16,power_law_1.2,0.17237119674682616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,1,16,power_law_1.01,0.42789759635925295
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,2,8,power_law_1.01,0.04535680115222931
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,1,16,power_law_1.2,0.20288000106811524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,2,8,power_law_1.01,0.03368319869041443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,1,16,power_law_1.01,0.520684814453125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,1,16,power_law_1.2,0.2315392017364502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,2,8,power_law_1.01,0.041254401206970215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,1,16,power_law_1.01,0.7150464057922363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,1,16,power_law_1.2,0.2981247901916504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,2,8,power_law_1.01,0.045542401075363156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,1,16,power_law_1.2,0.35177600383758545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,1,16,power_law_1.01,0.9542400360107421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,2,8,power_law_1.01,0.061536002159118655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,1,16,power_law_1.2,0.44742398262023925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,1,16,power_law_1.01,1.243622398376465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,2,8,power_law_1.01,0.06890239715576171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,1,16,power_law_1.2,0.6059391975402832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,1,16,power_law_1.01,1.681292724609375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,1,16,power_law_1.2,0.9305215835571289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,1,16,power_law_1.2,1.11014404296875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,1,16,power_law_1.01,3.444947052001953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,1,16,power_law_1.2,1.3550848007202148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,1,16,power_law_1.2,2.093177604675293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,2,8,power_law_1.2,0.02240640074014664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,1,16,power_law_1.2,6.256576156616211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,2,8,power_law_1.2,0.02261119931936264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,2,8,power_law_1.2,0.023520000278949738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,2,8,power_law_1.2,0.02260479927062988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,2,8,power_law_1.2,0.03258880078792572
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,2,8,power_law_1.2,0.04288640022277832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,2,8,power_law_1.01,0.08266239762306213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,2,8,power_law_1.2,0.0529151976108551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,2,8,power_law_1.01,0.0810368001461029
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,2,8,power_law_1.2,0.054553598165512085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,2,8,power_law_1.01,0.06465280055999756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,2,8,power_law_1.01,0.07608320116996765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,2,8,power_law_1.01,0.08757759928703308
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,2,8,power_law_1.01,0.10314879417419434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,2,8,power_law_1.01,0.10636160373687745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,2,8,power_law_1.01,0.10991359949111938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,2,8,power_law_1.01,0.1064255952835083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,2,8,power_law_1.01,0.1137984037399292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,2,8,power_law_1.01,0.11502079963684082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,2,8,power_law_1.01,0.1150272011756897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,2,8,power_law_1.01,0.1180351972579956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,2,8,power_law_1.01,0.11832319498062134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,2,8,power_law_1.01,0.12896000146865844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,2,8,power_law_1.01,0.12916480302810668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,2,8,power_law_1.01,0.14493440389633178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,2,8,power_law_1.01,0.1568063974380493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,2,8,power_law_1.01,0.17894400358200074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,2,8,power_law_1.01,0.20514559745788574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,2,8,power_law_1.01,0.2405695915222168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,2,8,power_law_1.01,0.2710720062255859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,2,8,power_law_1.01,0.336627197265625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,2,8,power_law_1.01,0.4287231922149658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,2,8,power_law_1.01,0.558016014099121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,2,8,power_law_1.01,0.7671103954315186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,2,8,power_law_1.01,0.9055487632751464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,2,8,power_law_1.01,1.238764762878418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,2,8,power_law_1.01,1.8075008392333984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,2,8,power_law_1.01,3.6099456787109374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,2,8,power_law_1.2,0.08225280046463013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,2,8,power_law_1.2,0.06505600214004517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,2,8,power_law_1.2,0.06362239718437195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,2,8,power_law_1.2,0.07735040187835693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,2,8,power_law_1.2,0.084307199716568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,2,8,power_law_1.2,0.09822720289230347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,2,8,power_law_1.2,0.10396800041198731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,2,8,power_law_1.2,0.11093120574951172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,2,8,power_law_1.2,0.10847359895706177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,2,8,power_law_1.2,0.10970879793167114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,2,8,power_law_1.2,0.1150272011756897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,2,8,power_law_1.2,0.11666560173034668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,2,8,power_law_1.2,0.11953279972076417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,2,8,power_law_1.2,0.12321280241012574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,2,8,power_law_1.2,0.12936960458755492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,2,8,power_law_1.2,0.14001280069351196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,2,8,power_law_1.2,0.14697599411010742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,2,8,power_law_1.2,0.16533119678497316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,2,8,power_law_1.2,0.18547840118408204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,2,8,power_law_1.2,0.21313281059265138
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,2,8,power_law_1.2,0.2272576093673706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,2,8,power_law_1.2,0.2882879972457886
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,2,8,power_law_1.2,0.36488320827484133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,2,8,power_law_1.2,0.46790399551391604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,2,8,power_law_1.2,0.5707071781158447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,2,8,power_law_1.2,0.7388415813446045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,2,8,power_law_1.2,0.9886655807495117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,2,8,power_law_1.2,1.3649151802062989
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,1,16,power_law_1.01,0.07037439942359924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,2,8,power_law_1.2,2.09564151763916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,1,16,power_law_1.01,0.08430079817771911
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,2,8,power_law_1.2,4.451251220703125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,1,16,power_law_1.01,0.09004799723625183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,1,16,power_law_1.01,0.10273920297622681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,1,16,power_law_1.01,0.11663360595703125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,1,16,power_law_1.01,0.15845119953155518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,1,16,power_law_1.01,0.18096640110015869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,4,4,power_law_1.01,0.022873599827289582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,1,16,power_law_1.01,0.22848000526428222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,4,4,power_law_1.01,0.024505600333213806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,1,16,power_law_1.01,0.3054975986480713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,4,4,power_law_1.01,0.02778240144252777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,4,4,power_law_1.01,0.02942720055580139
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,1,16,power_law_1.01,0.4015552043914795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,4,4,power_law_1.01,0.03617919981479645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,1,16,power_law_1.01,0.5838143825531006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,4,4,power_law_1.01,0.03761279881000519
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,1,16,power_law_1.01,0.6720831871032715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,4,4,power_law_1.01,0.04374400079250336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,1,16,power_law_1.01,1.0440064430236817
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,4,4,power_law_1.01,0.052127999067306516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,4,4,power_law_1.01,0.059935998916625974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,1,16,power_law_1.01,1.8418752670288085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,4,4,power_law_1.01,0.06832640171051026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,4,4,power_law_1.01,0.07366399765014649
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,4,4,power_law_1.01,0.08595200181007386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,4,4,power_law_1.01,0.07345280051231384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,4,4,power_law_1.2,0.022649599611759184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,4,4,power_law_1.01,0.07857279777526856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,4,4,power_law_1.2,0.024512000381946564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,4,4,power_law_1.01,0.09080320000648498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,4,4,power_law_1.2,0.02983039915561676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,4,4,power_law_1.01,0.08449919819831848
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,4,4,power_law_1.01,0.08533759713172913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,4,4,power_law_1.2,0.03433600068092346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,4,4,power_law_1.01,0.09946879744529724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,4,4,power_law_1.2,0.040479999780654904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,4,4,power_law_1.2,0.04254080057144165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,4,4,power_law_1.01,0.13017599582672118
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,4,4,power_law_1.2,0.047865599393844604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,4,4,power_law_1.01,0.1739776015281677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,4,4,power_law_1.2,0.05767679810523987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,4,4,power_law_1.01,0.225164794921875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,4,4,power_law_1.2,0.0630079984664917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,4,4,power_law_1.01,0.32064640522003174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,4,4,power_law_1.2,0.07162240147590637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,4,4,power_law_1.01,0.4201663970947266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,4,4,power_law_1.2,0.07427840232849121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,4,4,power_law_1.01,0.6161727905273438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,4,4,power_law_1.2,0.0886080026626587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,4,4,power_law_1.01,0.806828784942627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,4,4,power_law_1.2,0.07365760207176208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,4,4,power_law_1.01,1.197804832458496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,4,4,power_law_1.2,0.07796480059623719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,4,4,power_law_1.01,1.6030975341796876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,4,4,power_law_1.2,0.0902400016784668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,4,4,power_law_1.01,1.997337532043457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,4,4,power_law_1.2,0.08636159896850586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,4,4,power_law_1.2,0.08472319841384887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,4,4,power_law_1.01,3.1743040084838867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,4,4,power_law_1.2,0.0986303985118866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,4,4,power_law_1.2,0.12363519668579101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,4,4,power_law_1.01,6.318150329589844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,4,4,power_law_1.2,0.1539520025253296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,4,4,power_law_1.2,0.20084478855133056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,4,4,power_law_1.2,0.26740479469299316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,4,4,power_law_1.2,0.38147199153900146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,4,4,power_law_1.2,0.5276991844177246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,4,4,power_law_1.01,0.07038080096244811
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,4,4,power_law_1.2,0.7302591800689697
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,4,4,power_law_1.01,0.07119359970092773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,4,4,power_law_1.01,0.06832640171051026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,4,4,power_law_1.2,1.0415360450744628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,4,4,power_law_1.01,0.08145279884338379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,4,4,power_law_1.2,1.3296895980834962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,4,4,power_law_1.01,0.09597439765930176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,2,8,power_law_1.01,0.0693120002746582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,4,4,power_law_1.2,1.539187240600586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,4,4,power_law_1.01,0.12035200595855713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,2,8,power_law_1.01,0.07627519965171814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,4,4,power_law_1.2,2.6156415939331055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,4,4,power_law_1.01,0.12444800138473511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,2,8,power_law_1.01,0.08178560137748718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,4,4,power_law_1.01,0.12526079416275024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,2,8,power_law_1.01,0.09441919922828675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,4,4,power_law_1.2,5.225196838378906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,4,4,power_law_1.01,0.12874879837036132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,2,8,power_law_1.01,0.10618239641189575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,4,4,power_law_1.01,0.13385599851608276
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,2,8,power_law_1.01,0.08363519906997681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,4,4,power_law_1.01,0.1379647970199585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,2,8,power_law_1.01,0.09879680275917054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,2,8,power_law_1.01,0.11252479553222657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,4,4,power_law_1.01,0.13876479864120483
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,2,8,power_law_1.01,0.09081599712371827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,4,4,power_law_1.2,0.08123520016670227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,4,4,power_law_1.2,0.06690559983253479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,2,8,power_law_1.01,0.10736639499664306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,4,4,power_law_1.2,0.0695680022239685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,2,8,power_law_1.01,0.13649280071258546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,2,8,power_law_1.01,0.16475520133972169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,4,4,power_law_1.2,0.07898880243301391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,2,8,power_law_1.01,0.22435200214385986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,4,4,power_law_1.2,0.08676480054855347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,2,8,power_law_1.2,0.06335999965667724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,4,4,power_law_1.2,0.11790080070495605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,2,8,power_law_1.2,0.07217919826507568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,4,4,power_law_1.2,0.12444800138473511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,2,8,power_law_1.2,0.08773760199546814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,4,4,power_law_1.2,0.1299839973449707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,2,8,power_law_1.2,0.10369919538497925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,4,4,power_law_1.2,0.13018239736557008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,2,8,power_law_1.2,0.07626879811286927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,4,4,power_law_1.2,0.13181439638137818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,4,4,power_law_1.2,0.13817600011825562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,2,8,power_law_1.2,0.09141759872436524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,4,4,power_law_1.2,0.13878400325775148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,2,8,power_law_1.2,0.1131327986717224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,4,4,power_law_1.2,0.1453376054763794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,2,8,power_law_1.2,0.08568959832191467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,2,8,power_law_1.2,0.09941120147705078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,4,4,power_law_1.2,0.14164479970932006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,2,8,power_law_1.2,0.13237760066986085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,2,8,power_law_1.2,0.16433279514312743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,2,8,power_law_1.2,0.2298111915588379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,2,8,power_law_1.2,0.29580800533294677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,2,8,power_law_1.2,0.4322048187255859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,2,8,power_law_1.2,0.5685311794281006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,2,8,power_law_1.2,0.8436544418334961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,2,8,power_law_1.2,1.119929599761963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,2,8,power_law_1.2,1.6722047805786133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,2,8,power_law_1.2,2.226259231567383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,2,8,power_law_1.2,2.7783487319946287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,2,8,power_law_1.2,4.431884765625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,2,8,power_law_1.2,8.832697296142578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,1,16,power_law_1.01,0.09919999837875366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,1,16,power_law_1.01,0.14097919464111328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,1,16,power_law_1.01,0.17415679693222047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,1,16,power_law_1.01,0.08425599932670594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,1,16,power_law_1.01,0.10001920461654663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,1,16,power_law_1.01,0.11722240447998047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,1,16,power_law_1.01,0.1241919994354248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,1,16,power_law_1.01,0.13320319652557372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,1,16,power_law_1.01,0.14016000032424927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,1,16,power_law_1.01,0.145907199382782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,1,16,power_law_1.01,0.1536960005760193
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,1,16,power_law_1.01,0.15692800283432007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,1,16,power_law_1.01,0.15449600219726561
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,1,16,power_law_1.01,0.15205760002136232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,1,16,power_law_1.01,0.15531519651412964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,1,16,power_law_1.01,0.17252479791641234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,1,16,power_law_1.01,0.1771775960922241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,1,16,power_law_1.01,0.1893183946609497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,1,16,power_law_1.01,0.20897281169891357
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,1,16,power_law_1.01,0.24236159324645995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,1,16,power_law_1.01,0.27450881004333494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,1,16,power_law_1.01,0.34250879287719727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,1,16,power_law_1.01,0.37445759773254395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,1,16,power_law_1.01,0.4784895896911621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,1,16,power_law_1.01,0.5751616001129151
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,1,16,power_law_1.01,0.7903999805450439
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,1,16,power_law_1.01,0.9980735778808594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,1,16,power_law_1.01,1.2837632179260254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,1,16,power_law_1.01,1.886899185180664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,1,16,power_law_1.01,3.4879295349121096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,1,16,power_law_1.2,0.10022399425506592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,1,16,power_law_1.2,0.14097919464111328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,1,16,power_law_1.2,0.12829439640045165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,1,16,power_law_1.2,0.08118399977684021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,1,16,power_law_1.2,0.09695360064506531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,1,16,power_law_1.2,0.11169279813766479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,1,16,power_law_1.2,0.11660799980163575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,1,16,power_law_1.2,0.14344320297241211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,1,16,power_law_1.2,0.13626879453659058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,1,16,power_law_1.2,0.14098559617996215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,1,16,power_law_1.2,0.1467136025428772
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,1,16,power_law_1.2,0.1491711974143982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,1,16,power_law_1.2,0.15623680353164673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,1,16,power_law_1.2,0.14999680519104003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,1,16,power_law_1.2,0.16391680240631104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,1,16,power_law_1.2,0.16596479415893556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,1,16,power_law_1.2,0.17866239547729493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,1,16,power_law_1.2,0.196288001537323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,1,16,power_law_1.2,0.2085632085800171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,1,16,power_law_1.2,0.24563200473785402
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,1,16,power_law_1.2,0.28148479461669923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,1,16,power_law_1.2,0.35275518894195557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,1,16,power_law_1.2,0.37589120864868164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,1,16,power_law_1.2,0.5227263927459717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,1,16,power_law_1.2,0.6366144180297851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,1,16,power_law_1.2,0.9440064430236816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,1,16,power_law_1.2,1.1182847976684571
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,1,16,power_law_1.2,1.5465344429016112
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,1,16,power_law_1.2,2.302028846740723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,1,16,power_law_1.2,4.696096038818359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,2,8,power_law_1.01,0.09716479778289795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,2,8,power_law_1.01,0.11025919914245605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,2,8,power_law_1.01,0.1538815975189209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,2,8,power_law_1.01,0.08056960105895997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,4,4,power_law_1.01,0.14103039503097534
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,2,8,power_law_1.01,0.10124800205230713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,4,4,power_law_1.01,0.14124159812927245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,2,8,power_law_1.01,0.12010879516601562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,4,4,power_law_1.01,0.16049920320510863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,2,8,power_law_1.01,0.13176319599151612
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,4,4,power_law_1.01,0.16335359811782837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,4,4,power_law_1.01,0.17319040298461913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,2,8,power_law_1.01,0.1467136025428772
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,4,4,power_law_1.01,0.19612799882888793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,2,8,power_law_1.01,0.15285760164260864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,2,8,power_law_1.01,0.28292479515075686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,4,4,power_law_1.01,0.21413118839263917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,2,8,power_law_1.01,0.15900800228118897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,2,8,power_law_1.01,0.39310081005096437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,4,4,power_law_1.01,0.26451840400695803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,2,8,power_law_1.01,0.16269439458847046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,2,8,power_law_1.01,0.5342016220092773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,4,4,power_law_1.01,0.26922879219055174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,2,8,power_law_1.01,0.7707583904266357
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,2,8,power_law_1.01,0.17415679693222047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,4,4,power_law_1.01,0.3419519901275635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,2,8,power_law_1.01,0.9923520088195801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,4,4,power_law_1.01,0.40583038330078125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,2,8,power_law_1.01,0.1686336040496826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,2,8,power_law_1.01,1.434502410888672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,4,4,power_law_1.01,0.546131181716919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,2,8,power_law_1.01,0.17294080257415773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,2,8,power_law_1.01,1.8467775344848634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,4,4,power_law_1.01,0.6720767974853515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,2,8,power_law_1.01,0.18583680391311647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,4,4,power_law_1.01,0.9628992080688477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,2,8,power_law_1.01,2.2905664443969727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,2,8,power_law_1.01,0.19055999517440797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,4,4,power_law_1.2,0.16091519594192505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,4,4,power_law_1.01,1.3288703918457032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,2,8,power_law_1.01,0.19813120365142822
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,2,8,power_law_1.01,3.7548801422119142
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,4,4,power_law_1.2,0.160697603225708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,4,4,power_law_1.01,1.442739200592041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,2,8,power_law_1.01,0.22024960517883302
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,4,4,power_law_1.2,0.18321919441223145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,2,8,power_law_1.01,7.505382537841797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,2,8,power_law_1.01,0.2429503917694092
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,4,4,power_law_1.01,2.3235776901245115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,2,8,power_law_1.01,0.28434560298919676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,4,4,power_law_1.01,4.469279861450195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,2,8,power_law_1.01,0.31587839126586914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,2,8,power_law_1.01,0.3732352018356323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,2,8,power_law_1.2,0.08140159845352173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,2,8,power_law_1.01,0.40517759323120117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,2,8,power_law_1.2,0.11088639497756958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,2,8,power_law_1.01,0.5522240161895752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,2,8,power_law_1.2,0.10290559530258178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,4,4,power_law_1.01,0.0933184027671814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,2,8,power_law_1.01,0.6552320003509522
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,2,8,power_law_1.2,0.07955840229988098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,4,4,power_law_1.01,0.09248639941215515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,2,8,power_law_1.01,0.9292608261108398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,2,8,power_law_1.2,0.09798399806022644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,4,4,power_law_1.01,0.12772480249404908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,2,8,power_law_1.2,0.11435519456863404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,2,8,power_law_1.01,1.08920316696167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,4,4,power_law_1.01,0.08677120208740234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,2,8,power_law_1.2,0.12502399682998658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,2,8,power_law_1.01,1.321446418762207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,4,4,power_law_1.01,0.10497920513153076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,2,8,power_law_1.2,0.14979840517044068
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,2,8,power_law_1.01,2.0136703491210937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,4,4,power_law_1.01,0.14451199769973755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,2,8,power_law_1.2,0.1508288025856018
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,4,4,power_law_1.01,0.149017596244812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,2,8,power_law_1.01,3.8949825286865236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,2,8,power_law_1.2,0.15900800228118897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,4,4,power_law_1.01,0.18072320222854615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,2,8,power_law_1.2,0.1631168007850647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,4,4,power_law_1.01,0.18793599605560302
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,2,8,power_law_1.2,0.16639360189437866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,4,4,power_law_1.01,0.1998080015182495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,2,8,power_law_1.2,0.17212799787521363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,4,4,power_law_1.01,0.1969472050666809
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,2,8,power_law_1.2,0.17089279890060424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,4,4,power_law_1.01,0.218668794631958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,4,4,power_law_1.2,0.08609279990196228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,2,8,power_law_1.2,0.18072320222854615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,4,4,power_law_1.01,0.21744000911712646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,2,8,power_law_1.2,0.18810240030288697
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,4,4,power_law_1.01,0.218451189994812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,2,8,power_law_1.2,0.20161280632019044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,4,4,power_law_1.01,0.22541439533233643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,2,8,power_law_1.2,0.22659199237823485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,4,4,power_law_1.01,0.236678409576416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,4,4,power_law_1.01,0.24240000247955323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,2,8,power_law_1.2,0.25077118873596194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,4,4,power_law_1.01,0.27292799949645996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,2,8,power_law_1.2,0.2818943977355957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,2,8,power_law_1.2,0.331443190574646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,4,4,power_law_1.01,0.3005824089050293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,4,4,power_law_1.01,0.33826560974121095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,2,8,power_law_1.2,0.3951359987258911
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,4,4,power_law_1.01,0.37757439613342286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,2,8,power_law_1.2,0.4399871826171875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,4,4,power_law_1.01,0.46789121627807617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,2,8,power_law_1.2,0.5669760227203369
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,4,4,power_law_1.01,0.5276927947998047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,2,8,power_law_1.2,0.6962111949920654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,4,4,power_law_1.01,0.6798655986785889
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,2,8,power_law_1.2,0.9722687721252441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,4,4,power_law_1.01,0.8109312057495117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,2,8,power_law_1.2,1.1964608192443849
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,4,4,power_law_1.01,1.0859840393066407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,2,8,power_law_1.2,1.6198015213012695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,4,4,power_law_1.01,1.4013888359069824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,2,8,power_law_1.2,2.2885183334350585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,4,4,power_law_1.01,1.69486083984375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,2,8,power_law_1.2,4.320742416381836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,4,4,power_law_1.01,2.6033536911010744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,4,4,power_law_1.01,4.930624008178711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,8,2,power_law_1.01,0.08693119883537292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,8,2,power_law_1.01,0.09798399806022644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,8,2,power_law_1.01,0.11765120029449463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,8,2,power_law_1.2,0.08751999735832214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,8,2,power_law_1.2,0.09516159892082214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,8,2,power_law_1.01,0.10782719850540161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,8,2,power_law_1.01,0.14550399780273438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,8,2,power_law_1.2,0.09741439819335937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,8,2,power_law_1.01,0.18851200342178345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,8,2,power_law_1.2,0.10929280519485474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,8,2,power_law_1.01,0.2083712100982666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,8,2,power_law_1.2,0.13530240058898926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,8,2,power_law_1.01,0.2528127908706665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,8,2,power_law_1.2,0.16520960330963136
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,8,2,power_law_1.01,0.2593535900115967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,8,2,power_law_1.2,0.187116801738739
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,8,2,power_law_1.01,0.27329919338226316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,8,2,power_law_1.2,0.23626880645751952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,8,2,power_law_1.01,0.29066240787506104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,8,2,power_law_1.2,0.2430272102355957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,8,2,power_law_1.01,0.2999232053756714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,8,2,power_law_1.2,0.2550976037979126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,8,2,power_law_1.01,0.3025791883468628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,8,2,power_law_1.2,0.2771712064743042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,8,2,power_law_1.01,0.3064768075942993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,8,2,power_law_1.2,0.28991360664367677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,8,2,power_law_1.01,0.31775360107421874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,8,2,power_law_1.2,0.3095679998397827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,8,2,power_law_1.01,0.32019839286804197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,8,2,power_law_1.2,0.2981247901916504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,8,2,power_law_1.01,0.3341248035430908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,8,2,power_law_1.2,0.31614079475402834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,8,2,power_law_1.01,0.37467520236968993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,8,2,power_law_1.2,0.33006720542907714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,8,2,power_law_1.01,0.42197117805480955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,8,2,power_law_1.2,0.348089599609375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,8,2,power_law_1.01,0.4887231826782227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,8,2,power_law_1.2,0.38392961025238037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,8,2,power_law_1.01,0.552236795425415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,8,2,power_law_1.2,0.4285696029663086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,8,2,power_law_1.2,0.4866943836212158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,8,2,power_law_1.01,0.6752448081970215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,8,2,power_law_1.01,0.7437183856964111
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,8,2,power_law_1.2,0.5850495815277099
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,8,2,power_law_1.2,0.6823040008544922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,8,2,power_law_1.01,0.9882559776306152
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,8,2,power_law_1.2,0.7830143928527832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,8,2,power_law_1.01,1.1838272094726563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,8,2,power_law_1.2,0.9972928047180176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,8,2,power_law_1.01,1.5731648445129394
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,8,2,power_law_1.2,1.1613504409790039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,8,2,power_law_1.01,2.036204719543457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,8,2,power_law_1.2,1.58340482711792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,8,2,power_law_1.01,2.4565759658813477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,8,2,power_law_1.2,2.095648002624512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,8,2,power_law_1.01,3.64758415222168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,8,2,power_law_1.2,2.4440128326416017
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,8,2,power_law_1.01,7.1170814514160154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,8,2,power_law_1.2,3.9817665100097654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,8,2,power_law_1.2,7.177152252197265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,16,1,power_law_1.01,0.10982400178909302
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,16,1,power_law_1.01,0.11817599534988403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,16,1,power_law_1.01,0.13566720485687256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,16,1,power_law_1.2,0.10723199844360351
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,16,1,power_law_1.01,0.15000319480895996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,16,1,power_law_1.2,0.11666560173034668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,16,1,power_law_1.01,0.21882240772247313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,16,1,power_law_1.2,0.1273151993751526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,16,1,power_law_1.01,0.288044810295105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,16,1,power_law_1.2,0.15352959632873536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,16,1,power_law_1.01,0.30135679244995117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,16,1,power_law_1.2,0.20083839893341066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,16,1,power_law_1.01,0.3941312074661255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,16,1,power_law_1.2,0.2526592016220093
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,16,1,power_law_1.01,0.41829757690429686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,16,1,power_law_1.2,0.2923840045928955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,16,1,power_law_1.01,0.4346816062927246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,16,1,power_law_1.2,0.3796031951904297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,16,1,power_law_1.01,0.44778881072998045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,16,1,power_law_1.2,0.39397120475769043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,16,1,power_law_1.01,0.4740096092224121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,16,1,power_law_1.2,0.41854081153869627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,16,1,power_law_1.01,0.47891840934753416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,16,1,power_law_1.2,0.4556096076965332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,4,4,power_law_1.2,0.19716479778289794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,16,1,power_law_1.01,0.5022528171539307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,16,1,power_law_1.2,0.4642047882080078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,4,4,power_law_1.2,0.21784958839416504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,16,1,power_law_1.01,0.5083968162536621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,16,1,power_law_1.2,0.4555967807769775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,4,4,power_law_1.2,0.2444607973098755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,16,1,power_law_1.01,0.5272448062896729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,16,1,power_law_1.2,0.4986112117767334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,4,4,power_law_1.2,0.28580479621887206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,16,1,power_law_1.01,0.5641151905059815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,16,1,power_law_1.2,0.498195219039917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,4,4,power_law_1.2,0.3608000040054321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,4,4,power_law_1.2,0.42140798568725585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,16,1,power_law_1.01,0.6388671875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,16,1,power_law_1.2,0.5268799781799316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,4,4,power_law_1.2,0.5604735851287842
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,16,1,power_law_1.01,0.683903980255127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,16,1,power_law_1.2,0.5846208095550537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,4,4,power_law_1.2,0.7064896106719971
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,16,1,power_law_1.01,0.8092479705810547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,16,1,power_law_1.2,0.6774015903472901
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,4,4,power_law_1.2,1.0112256050109862
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,16,1,power_law_1.01,0.9124671936035156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,16,1,power_law_1.2,0.6995327949523926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,4,4,power_law_1.2,1.3477120399475098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,16,1,power_law_1.01,1.128115177154541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,4,4,power_law_1.2,1.7230976104736329
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,16,1,power_law_1.01,1.267193603515625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,4,4,power_law_1.2,2.6201408386230467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,16,1,power_law_1.01,1.6772031784057617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,16,1,power_law_1.01,1.9772287368774415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,4,4,power_law_1.2,5.7462207794189455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,16,1,power_law_1.01,2.6934207916259765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,16,1,power_law_1.01,3.427347183227539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,16,1,power_law_1.01,4.167027282714844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,16,1,power_law_1.01,6.316121673583984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,4,4,power_law_1.2,0.09428480267524719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,4,4,power_law_1.2,0.09244800209999085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,16,1,power_law_1.01,12.153536224365235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,4,4,power_law_1.2,0.08855680227279664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,4,4,power_law_1.2,0.10836479663848878
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,4,4,power_law_1.2,0.13320319652557372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,4,4,power_law_1.2,0.145907199382782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,4,4,power_law_1.2,0.18195199966430664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,4,4,power_law_1.2,0.19218560457229614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,4,4,power_law_1.2,0.18970880508422852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,4,4,power_law_1.2,0.20078721046447753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,4,4,power_law_1.2,0.20115199089050292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,4,4,power_law_1.2,0.20570878982543944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,4,4,power_law_1.2,0.20857601165771483
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,4,4,power_law_1.2,0.23088641166687013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,4,4,power_law_1.2,0.23416318893432617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,8,power_law_1.01,0.047040000557899475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,4,4,power_law_1.2,0.25402240753173827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,8,power_law_1.01,0.05236480236053467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,8,power_law_1.01,0.04970879852771759
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,4,4,power_law_1.2,0.2728640079498291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,8,power_law_1.01,0.046009600162506104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,4,4,power_law_1.2,0.3027647972106934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,8,power_law_1.01,0.04417920112609863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,8,power_law_1.01,0.04991360008716583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,4,4,power_law_1.2,0.3568320035934448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,8,power_law_1.01,0.05441920161247253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,8,power_law_1.01,0.05482239723205566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,4,4,power_law_1.2,0.4029248237609863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,8,power_law_1.01,0.06157439947128296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,4,4,power_law_1.2,0.46945919990539553
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,8,power_law_1.2,0.04760960042476654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,8,power_law_1.01,0.06299520134925843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,8,power_law_1.2,0.04924159944057464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,8,power_law_1.01,0.049292799830436704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,4,4,power_law_1.2,0.5567296028137207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,8,power_law_1.2,0.04822399914264679
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,8,power_law_1.01,0.05850239992141724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,4,4,power_law_1.2,0.7211775779724121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,8,power_law_1.2,0.0474047988653183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,8,power_law_1.01,0.05605760216712952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,8,power_law_1.2,0.04842239916324616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,8,power_law_1.01,0.06464639902114869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,4,4,power_law_1.2,0.835865592956543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,8,power_law_1.2,0.052313601970672606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,8,power_law_1.01,0.07345920205116271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,8,power_law_1.2,0.052928000688552856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,8,power_law_1.01,0.0720192015171051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,4,4,power_law_1.2,1.1305600166320802
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,8,power_law_1.2,0.05457280278205871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,8,power_law_1.01,0.08513280153274536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,4,4,power_law_1.2,1.5633088111877442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,8,power_law_1.2,0.062745600938797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,8,power_law_1.01,0.09681280255317688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,8,power_law_1.2,0.06335999965667724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,8,power_law_1.01,0.11831040382385254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,4,4,power_law_1.2,1.7431295394897461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,8,power_law_1.2,0.05128960013389587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,8,power_law_1.01,0.1480191946029663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,8,power_law_1.2,0.0574400007724762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,8,power_law_1.01,0.18199679851531983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,4,4,power_law_1.2,2.6463039398193358
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,8,power_law_1.2,0.06173440217971802
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,8,power_law_1.01,0.27025279998779295
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,8,power_law_1.2,0.06480640172958374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,8,power_law_1.01,0.34131200313568116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,8,power_law_1.2,0.07708160281181335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,4,4,power_law_1.2,5.487488174438477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,8,power_law_1.01,0.5096640110015869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,8,power_law_1.2,0.08426240086555481
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,8,power_law_1.01,0.5895487785339355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,8,power_law_1.2,0.0946943998336792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,8,power_law_1.01,0.9047360420227051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,8,power_law_1.2,0.12420480251312256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,8,power_law_1.01,1.3370688438415528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,8,power_law_1.2,0.11395839452743531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,8,power_law_1.01,1.6948352813720704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,8,power_law_1.2,0.1549183964729309
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,8,power_law_1.2,0.17007999420166015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,8,power_law_1.01,2.664371109008789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,8,power_law_1.2,0.256710410118103
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,8,power_law_1.01,5.302412796020508
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,8,power_law_1.2,0.3434751987457275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,8,power_law_1.2,0.4805568218231201
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,8,power_law_1.2,0.6157248020172119
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,8,power_law_1.2,0.9763775825500488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,8,power_law_1.2,1.335801601409912
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,8,power_law_1.2,1.7017791748046875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,8,power_law_1.2,2.5734079360961912
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,8,power_law_1.2,5.355136108398438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,4,power_law_1.01,0.0438975989818573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,4,power_law_1.01,0.04227840006351471
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,4,power_law_1.01,0.0433023989200592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,4,power_law_1.01,0.04596480131149292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,4,power_law_1.01,0.046374401450157164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,4,power_law_1.01,0.05004799962043762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,4,power_law_1.01,0.05537279844284058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,4,power_law_1.01,0.04799999892711639
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,4,power_law_1.01,0.05312640070915222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,4,power_law_1.2,0.042124798893928526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,4,power_law_1.01,0.053324800729751584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,4,power_law_1.2,0.039654400944709775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,4,power_law_1.01,0.05681920051574707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,4,power_law_1.2,0.04028800129890442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,4,power_law_1.01,0.05937920212745666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,4,power_law_1.2,0.051545602083206174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,4,power_law_1.01,0.05864959955215454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,4,power_law_1.2,0.044172799587249754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,4,power_law_1.01,0.057011198997497556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,4,power_law_1.2,0.0490880012512207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,4,power_law_1.01,0.06316800117492676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,4,power_law_1.2,0.053388798236846925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,4,power_law_1.01,0.0711359977722168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,4,power_law_1.2,0.04108799993991852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,4,power_law_1.01,0.07750399708747864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,2,power_law_1.01,0.03754880130290985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,4,power_law_1.2,0.045184001326560974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,4,power_law_1.01,0.09633280038833618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,2,power_law_1.01,0.03408640027046204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,4,power_law_1.2,0.04826880097389221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,4,power_law_1.01,0.0946943998336792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,2,power_law_1.01,0.03573119938373566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,4,power_law_1.2,0.0490880012512207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,4,power_law_1.01,0.1164031982421875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,2,power_law_1.01,0.041459199786186215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,4,power_law_1.2,0.05134080052375793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,4,power_law_1.01,0.15081599950790406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,2,power_law_1.01,0.03716480135917664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,4,power_law_1.2,0.05482239723205566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,4,power_law_1.01,0.18911999464035034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,2,power_law_1.01,0.05375360250473023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,4,power_law_1.2,0.060140800476074216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,4,power_law_1.01,0.25137279033660886
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,2,power_law_1.01,0.057030397653579715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,4,power_law_1.2,0.06629120111465454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,2,power_law_1.01,0.04330880045890808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,4,power_law_1.2,0.06833279728889466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,2,power_law_1.01,0.044940799474716187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,2,power_law_1.01,0.04596480131149292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,4,power_law_1.2,0.07529600262641907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,2,power_law_1.01,0.05088000297546387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,4,power_law_1.2,0.09065600037574768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,2,power_law_1.01,0.05108479857444763
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,4,power_law_1.2,0.10170880556106568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,2,power_law_1.01,0.05249919891357422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,4,power_law_1.2,0.13203840255737304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,2,power_law_1.01,0.06421120166778564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,4,power_law_1.2,0.14984320402145385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,2,power_law_1.01,0.0732096016407013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,4,power_law_1.2,0.1955135941505432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,2,power_law_1.01,0.077920001745224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,4,power_law_1.2,0.2323904037475586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,2,power_law_1.01,0.07198079824447631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,4,power_law_1.2,0.3583296060562134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,2,power_law_1.01,0.08366720080375671
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,4,power_law_1.2,0.5309631824493408
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,2,power_law_1.01,0.08774399757385254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,4,power_law_1.2,0.8600959777832031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,2,power_law_1.01,0.11066880226135253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,4,power_law_1.2,1.0042559623718261
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,2,power_law_1.01,0.12049920558929443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,4,power_law_1.2,1.2481792449951172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,2,power_law_1.01,0.1538879990577698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,4,power_law_1.2,2.3127296447753904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,2,power_law_1.01,0.2024319887161255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,2,power_law_1.01,0.29049599170684814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,4,power_law_1.2,3.8950336456298826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,2,power_law_1.01,0.37959039211273193
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,2,power_law_1.01,0.5210303783416748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,2,power_law_1.01,0.68023681640625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,2,power_law_1.01,0.8842111587524414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,2,power_law_1.01,1.2583871841430665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,2,power_law_1.01,2.5191999435424806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,16,1,power_law_1.2,0.8215744018554687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,16,1,power_law_1.2,0.9198975563049316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,16,1,power_law_1.2,1.1326784133911132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,16,1,power_law_1.2,1.2862591743469238
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,16,1,power_law_1.2,1.679212760925293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,16,1,power_law_1.2,1.9879232406616212
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,16,1,power_law_1.2,2.705267143249512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,16,1,power_law_1.2,3.4434368133544924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,16,1,power_law_1.2,4.154073715209961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,16,1,power_law_1.2,6.310438537597657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,2,power_law_1.2,0.03639039993286133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,2,power_law_1.2,0.03700479865074158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,2,power_law_1.2,0.03475199937820435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,16,1,power_law_1.2,12.190624237060547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,2,power_law_1.2,0.046623998880386354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,2,power_law_1.2,0.042131200432777405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,2,power_law_1.2,0.04827519953250885
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,2,power_law_1.2,0.04990079998970032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,2,power_law_1.2,0.041503998637199405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,2,power_law_1.2,0.04622080028057098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,1,power_law_1.01,0.032864001393318173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,1,power_law_1.01,0.03777279853820801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,2,power_law_1.2,0.04581120014190674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,1,power_law_1.01,0.037363201379776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,2,power_law_1.2,0.04806399941444397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,1,power_law_1.01,0.0406464010477066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,2,power_law_1.2,0.05317760109901428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,1,power_law_1.01,0.042694398760795595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,2,power_law_1.2,0.055238401889801024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,1,power_law_1.01,0.04842880070209503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,2,power_law_1.2,0.05236480236053467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,1,power_law_1.01,0.04965119957923889
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,2,power_law_1.2,0.060550397634506224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,1,power_law_1.01,0.04227840006351471
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,2,power_law_1.2,0.06588159799575806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,1,power_law_1.01,0.04597119987010956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,2,power_law_1.2,0.06731520295143127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,1,power_law_1.01,0.046374401450157164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,2,power_law_1.2,0.0834879994392395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,1,power_law_1.01,0.04801279902458191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,2,power_law_1.2,0.09331200122833253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,1,power_law_1.01,0.05128960013389587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,2,power_law_1.2,0.10232959985733033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,1,power_law_1.01,0.05539199709892273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,2,power_law_1.2,0.12957439422607422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,1,power_law_1.01,0.056409597396850586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,2,power_law_1.2,0.17668479681015015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,1,power_law_1.01,0.06972799897193908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,2,power_law_1.2,0.2043328046798706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,1,power_law_1.01,0.07216640114784241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,2,power_law_1.2,0.30179200172424314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,1,power_law_1.01,0.0676800012588501
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,2,power_law_1.2,0.3866048097610474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,1,power_law_1.01,0.08365439772605895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,2,power_law_1.2,0.5100863933563232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,1,power_law_1.01,0.09226239919662475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,2,power_law_1.2,0.7089600086212158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,1,power_law_1.01,0.1115007996559143
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,2,power_law_1.2,0.9628800392150879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,1,power_law_1.01,0.12788480520248413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,2,power_law_1.2,1.380083179473877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,1,power_law_1.01,0.1672127962112427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,1,power_law_1.01,0.18725759983062745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,2,power_law_1.2,2.730521583557129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,1,power_law_1.01,0.26140799522399905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,1,power_law_1.2,0.03147520124912262
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,1,power_law_1.01,0.3363647937774658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,1,power_law_1.2,0.033932799100875856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,1,power_law_1.01,0.4788991928100586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,1,power_law_1.2,0.032287999987602234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,1,power_law_1.01,0.6128511905670166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,1,power_law_1.2,0.03880960047245026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,1,power_law_1.01,0.7646016120910645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,1,power_law_1.2,0.04539520144462585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,1,power_law_1.01,1.3050687789916993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,1,power_law_1.2,0.04499199986457825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,1,power_law_1.01,2.3808767318725588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,1,power_law_1.2,0.050521600246429446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,1,power_law_1.2,0.04007039964199066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,1,power_law_1.2,0.043347200751304625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,1,power_law_1.2,0.044582399725914004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,1,power_law_1.2,0.043750399351119997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,1,power_law_1.2,0.05194240212440491
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,1,power_law_1.2,0.05440639853477478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,1,power_law_1.2,0.05808640122413635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,1,power_law_1.2,0.06874880194664001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,1,power_law_1.2,0.07120640277862549
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,1,power_law_1.2,0.06566399931907654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,1,power_law_1.2,0.0830847978591919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,1,power_law_1.2,0.08676480054855347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,1,power_law_1.2,0.11133439540863037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,1,power_law_1.2,0.12813440561294556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,1,power_law_1.2,0.16745599508285522
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,1,power_law_1.2,0.18506239652633666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,1,power_law_1.2,0.2563391923904419
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,1,power_law_1.2,0.3308160066604614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,1,power_law_1.2,0.47772798538208006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,1,power_law_1.2,0.6059328079223633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,1,power_law_1.2,0.7601471900939941
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,1,power_law_1.2,1.3173376083374024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,1,power_law_1.2,2.342361640930176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,8,power_law_1.01,0.06629760265350342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,8,power_law_1.01,0.0793727993965149
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,8,power_law_1.01,0.05973119735717773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,8,power_law_1.01,0.06096000075340271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,8,power_law_1.01,0.061791998147964475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,8,power_law_1.01,0.06097279787063599
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,8,power_law_1.01,0.06096640229225159
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,8,power_law_1.01,0.06342399716377259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,8,power_law_1.01,0.06321280002593994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,8,power_law_1.2,0.06746879816055298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,8,power_law_1.01,0.0642304003238678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,8,power_law_1.2,0.07157120108604431
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,8,power_law_1.01,0.06710399985313416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,8,power_law_1.2,0.06235520243644714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,8,power_law_1.01,0.0732479989528656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,8,power_law_1.2,0.06214399933815003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,8,power_law_1.01,0.07447680234909057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,8,power_law_1.2,0.06112639904022217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,8,power_law_1.01,0.08246399760246277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,8,power_law_1.2,0.06051200032234192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,8,power_law_1.01,0.0925055980682373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,8,power_law_1.2,0.05989120006561279
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,8,power_law_1.01,0.10559359788894654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,8,power_law_1.2,0.06030719876289368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,8,power_law_1.01,0.12323199510574341
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,8,power_law_1.2,0.06542720198631287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,8,power_law_1.01,0.1711359977722168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,8,power_law_1.2,0.0603007972240448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,8,power_law_1.01,0.1664255976676941
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,8,power_law_1.2,0.06849279999732971
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,8,power_law_1.01,0.23054080009460448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,8,power_law_1.2,0.07895039916038513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,8,power_law_1.01,0.2553215980529785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,8,power_law_1.2,0.07626240253448487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,8,power_law_1.01,0.3587392091751099
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,4,power_law_1.01,0.33104639053344725
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,8,power_law_1.2,0.0844543993473053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,8,power_law_1.01,0.5174719810485839
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,4,power_law_1.01,0.38857600688934324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,8,power_law_1.2,0.1016767978668213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,8,power_law_1.01,0.7998847961425781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,4,power_law_1.01,0.6271872043609619
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,8,power_law_1.2,0.11723519563674926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,8,power_law_1.01,0.9956735610961914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,8,power_law_1.2,0.13299200534820557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,4,power_law_1.01,0.9444160461425781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,8,power_law_1.01,1.4953727722167969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,8,power_law_1.2,0.1676095962524414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,4,power_law_1.01,1.0246912002563477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,8,power_law_1.01,2.0436416625976563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,8,power_law_1.2,0.17067519426345826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,4,power_law_1.01,1.9493568420410157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,8,power_law_1.2,0.22087039947509765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,8,power_law_1.01,2.4980800628662108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,4,power_law_1.01,3.236537551879883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,8,power_law_1.2,0.2695807933807373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,8,power_law_1.01,4.294988632202148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,4,power_law_1.01,0.06198400259017944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,8,power_law_1.2,0.3830591917037964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,4,power_law_1.01,0.0470335990190506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,8,power_law_1.2,0.49365758895874023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,8,power_law_1.01,8.562419128417968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,4,power_law_1.01,0.057062399387359616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,8,power_law_1.2,0.7424960136413574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,4,power_law_1.01,0.05726720094680786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,8,power_law_1.2,0.9902976036071778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,4,power_law_1.01,0.06259840130805969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,8,power_law_1.2,1.5186752319335937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,4,power_law_1.01,0.06382079720497132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,8,power_law_1.2,1.9048704147338866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,4,power_law_1.01,0.06382719874382019
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,8,power_law_1.2,2.748102378845215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,4,power_law_1.01,0.06710399985313416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,4,power_law_1.01,0.06710399985313416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,8,power_law_1.2,4.157324981689453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,4,power_law_1.01,0.06772480010986329
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,8,power_law_1.2,8.572601318359375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,4,power_law_1.01,0.06096000075340271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,4,power_law_1.01,0.06751360297203064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,4,power_law_1.01,0.0695360004901886
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,4,power_law_1.01,0.07509120106697083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,4,power_law_1.01,0.0830784022808075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,4,power_law_1.01,0.0918720006942749
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,4,power_law_1.01,0.10110080242156982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,4,power_law_1.01,0.11175040006637574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,4,power_law_1.01,0.1453376054763794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,4,power_law_1.01,0.16028800010681152
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,4,power_law_1.01,0.2495807886123657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,4,power_law_1.01,0.2551104068756104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,4,power_law_1.01,0.32739839553833006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,4,power_law_1.01,0.5735743999481201
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,4,power_law_1.01,0.7269824028015137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,4,power_law_1.01,1.0345855712890626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,4,power_law_1.01,1.3714752197265625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,4,power_law_1.01,1.8374015808105468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,4,power_law_1.01,2.652422332763672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,4,power_law_1.01,6.350502395629883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,4,power_law_1.2,0.0662335991859436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,4,power_law_1.2,0.05702400207519531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,4,power_law_1.2,0.056620800495147706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,4,power_law_1.2,0.05824000239372253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,2,power_law_1.01,0.04314239919185638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,4,power_law_1.2,0.0586624026298523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,2,power_law_1.01,0.04663040041923523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,4,power_law_1.2,0.05989120006561279
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,2,power_law_1.01,0.04477440118789673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,4,power_law_1.2,0.06151679754257202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,2,power_law_1.01,0.055232000350952146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,2,power_law_1.01,0.058297598361968996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,4,power_law_1.2,0.061945599317550656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,2,power_law_1.01,0.05850239992141724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,4,power_law_1.2,0.06766719818115234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,2,power_law_1.01,0.05870720148086548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,4,power_law_1.2,0.06971520185470581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,2,power_law_1.01,0.05768960118293762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,4,power_law_1.2,0.06603519916534424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,2,power_law_1.01,0.06218879818916321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,4,power_law_1.2,0.06807680130004883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,2,power_law_1.2,0.047814399003982544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,2,power_law_1.01,0.06670079827308655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,4,power_law_1.2,0.07095040082931518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,2,power_law_1.2,0.04679040014743805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,2,power_law_1.01,0.06607999801635742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,4,power_law_1.2,0.07708799839019775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,2,power_law_1.2,0.05004799962043762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,2,power_law_1.01,0.070387202501297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,4,power_law_1.2,0.08650239706039428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,2,power_law_1.2,0.056620800495147706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,2,power_law_1.01,0.0720192015171051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,4,power_law_1.2,0.08896639943122864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,2,power_law_1.2,0.05866879820823669
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,2,power_law_1.01,0.06812800168991089
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,2,power_law_1.2,0.058841598033905027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,4,power_law_1.2,0.10166399478912354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,2,power_law_1.01,0.07878400087356567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,2,power_law_1.2,0.05948160290718078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,4,power_law_1.2,0.11190400123596192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,2,power_law_1.2,0.05988479852676391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,2,power_law_1.01,0.08388479948043823
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,4,power_law_1.2,0.14261120557785034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,2,power_law_1.2,0.06112639904022217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,2,power_law_1.01,0.08347520232200623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,4,power_law_1.2,0.17252479791641234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,2,power_law_1.2,0.06522240042686463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,2,power_law_1.01,0.11052800416946411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,4,power_law_1.2,0.1970944046974182
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,2,power_law_1.2,0.07176960110664368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,2,power_law_1.01,0.11379200220108032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,4,power_law_1.2,0.349452805519104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,2,power_law_1.2,0.07176960110664368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,2,power_law_1.01,0.16560640335083007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,4,power_law_1.2,0.43485441207885744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,2,power_law_1.2,0.07382400035858154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,2,power_law_1.01,0.16909439563751222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,4,power_law_1.2,0.5296768188476563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,2,power_law_1.2,0.0760703980922699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,2,power_law_1.01,0.23751039505004884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,4,power_law_1.2,0.7977663993835449
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,2,power_law_1.2,0.08489599823951721
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,2,power_law_1.01,0.2796927928924561
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,4,power_law_1.2,1.0320639610290527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,2,power_law_1.2,0.08590720295906067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,2,power_law_1.01,0.40051841735839844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,2,power_law_1.2,0.0828224003314972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,4,power_law_1.2,1.5907584190368653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,2,power_law_1.01,0.5092607975006104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,2,power_law_1.2,0.10759680271148682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,4,power_law_1.2,2.368179130554199
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,2,power_law_1.01,0.7769216060638428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,2,power_law_1.2,0.11723519563674926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,1,power_law_1.01,0.035148799419403076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,4,power_law_1.2,3.0405311584472656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,2,power_law_1.01,0.896947193145752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,2,power_law_1.2,0.145907199382782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,1,power_law_1.01,0.03985919952392578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,2,power_law_1.01,1.3739263534545898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,2,power_law_1.2,0.16106879711151123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,4,power_law_1.2,6.669817352294922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,1,power_law_1.01,0.04252159893512726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,2,power_law_1.01,2.139468765258789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,2,power_law_1.2,0.23355519771575928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,1,power_law_1.01,0.05727360248565674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,2,power_law_1.2,0.2935551881790161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,2,power_law_1.01,3.784832000732422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,1,power_law_1.01,0.05870720148086548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,2,power_law_1.2,0.41254401206970215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,1,power_law_1.01,0.058905601501464844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,2,power_law_1.2,0.6247360229492187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,1,power_law_1.01,0.05994240045547485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,2,power_law_1.2,0.8248255729675293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,1,power_law_1.01,0.0593280017375946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,2,power_law_1.2,1.0505215644836425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,1,power_law_1.01,0.0599295973777771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,2,power_law_1.2,1.3615936279296874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,1,power_law_1.01,0.060134398937225345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,1,power_law_1.01,0.06381440162658691
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,2,power_law_1.2,2.131635284423828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,1,power_law_1.01,0.07079039812088013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,2,power_law_1.2,4.4552959442138675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,1,power_law_1.01,0.07180799841880799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,1,power_law_1.01,0.06874240040779114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,1,power_law_1.01,0.0769216001033783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,1,power_law_1.01,0.0785535991191864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,1,power_law_1.01,0.08588799834251404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,1,power_law_1.01,0.09781759977340698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,1,power_law_1.01,0.12014720439910889
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,1,power_law_1.01,0.1338688015937805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,1,power_law_1.01,0.1572224020957947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,1,power_law_1.01,0.21169281005859375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,1,power_law_1.01,0.25155839920043943
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,1,power_law_1.01,0.3515712022781372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,1,power_law_1.01,0.44946560859680174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,1,power_law_1.01,0.6524096012115479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,1,power_law_1.01,0.8362624168395996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,1,power_law_1.01,1.058067226409912
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,1,power_law_1.01,1.6710271835327148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,1,power_law_1.01,3.3651905059814453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,32,power_law_1.01,0.1568127989768982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,32,power_law_1.01,0.15968639850616456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,32,power_law_1.01,0.12445440292358398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,32,power_law_1.01,0.09660159945487976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,32,power_law_1.01,0.09987840056419373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,32,power_law_1.01,0.12384639978408814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,32,power_law_1.01,0.14247039556503296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,32,power_law_1.2,0.16595840454101562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,32,power_law_1.01,0.14595839977264405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,1,power_law_1.2,0.03898879885673523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,32,power_law_1.2,0.15594880580902098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,32,power_law_1.01,0.14287999868392945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,1,power_law_1.2,0.04083200097084046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,32,power_law_1.2,0.08794879913330078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,32,power_law_1.01,0.15045759677886963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,1,power_law_1.2,0.041459199786186215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,32,power_law_1.2,0.09244800209999085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,1,power_law_1.2,0.05865600109100342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,32,power_law_1.01,0.15619200468063354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,1,power_law_1.2,0.0586624026298523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,32,power_law_1.2,0.10758399963378906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,32,power_law_1.01,0.1615231990814209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,1,power_law_1.2,0.06027519702911377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,32,power_law_1.2,0.11560319662094116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,32,power_law_1.01,0.1576192021369934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,1,power_law_1.2,0.060703998804092406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,32,power_law_1.2,0.13463040590286254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,1,power_law_1.2,0.060710400342941284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,32,power_law_1.01,0.1643839955329895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,32,power_law_1.2,0.1348479986190796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,1,power_law_1.2,0.061318397521972656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,32,power_law_1.01,0.1789247989654541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,1,power_law_1.2,0.061919999122619626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,32,power_law_1.2,0.14754559993743896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,32,power_law_1.01,0.1971519947052002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,1,power_law_1.2,0.065830397605896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,32,power_law_1.2,0.15062400102615356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,32,power_law_1.01,0.17176320552825927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,1,power_law_1.2,0.06889600157737732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,32,power_law_1.2,0.16188160181045533
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,1,power_law_1.2,0.07339519858360291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,32,power_law_1.01,0.1994047999382019
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,1,power_law_1.2,0.06951680183410644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,32,power_law_1.2,0.16433279514312743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,32,power_law_1.01,0.205132794380188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,1,power_law_1.2,0.07667840123176575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,16,power_law_1.01,0.11134079694747925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,32,power_law_1.2,0.16433919668197633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,32,power_law_1.01,0.2362623929977417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,1,power_law_1.2,0.07811200022697448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,16,power_law_1.01,0.17726080417633056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,32,power_law_1.2,0.17950079441070557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,32,power_law_1.01,0.27720959186553956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,1,power_law_1.2,0.08692479729652405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,16,power_law_1.01,0.0945472002029419
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,32,power_law_1.2,0.2016063928604126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,1,power_law_1.2,0.09838079810142517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,32,power_law_1.01,0.34092159271240235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,16,power_law_1.01,0.08163840174674988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,1,power_law_1.2,0.11802239418029785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,32,power_law_1.2,0.20816640853881835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,32,power_law_1.01,0.38904318809509275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,1,power_law_1.2,0.13443200588226317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,16,power_law_1.01,0.10028799772262573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,32,power_law_1.2,0.18851200342178345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,32,power_law_1.01,0.4941120147705078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,1,power_law_1.2,0.15614720582962036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,16,power_law_1.01,0.11831040382385254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,32,power_law_1.2,0.2167680025100708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,1,power_law_1.2,0.21000959873199462
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,32,power_law_1.01,0.6593791961669921
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,16,power_law_1.01,0.13140480518341063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,32,power_law_1.2,0.23006720542907716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,1,power_law_1.2,0.24995200634002684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,32,power_law_1.01,0.9473343849182129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,16,power_law_1.01,0.14493440389633178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,32,power_law_1.2,0.2683903932571411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,1,power_law_1.2,0.3504960060119629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,32,power_law_1.01,1.2522879600524903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,1,power_law_1.2,0.4490047931671143
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,16,power_law_1.01,0.1430848002433777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,32,power_law_1.2,0.28906879425048826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,1,power_law_1.2,0.6519487857818603
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,16,power_law_1.01,0.14165760278701783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,32,power_law_1.01,1.364095973968506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,32,power_law_1.2,0.3750848054885864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,1,power_law_1.2,0.8375040054321289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,16,power_law_1.01,0.14697599411010742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,32,power_law_1.2,0.465388822555542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,32,power_law_1.01,2.607033538818359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,1,power_law_1.2,1.0593024253845216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,16,power_law_1.01,0.1584447979927063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,32,power_law_1.2,0.6206208229064941
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,1,power_law_1.2,1.6661439895629884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,32,power_law_1.01,4.663423919677735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,16,power_law_1.01,0.15863679647445678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,32,power_law_1.2,0.7969535827636719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,1,power_law_1.2,3.3364673614501954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,16,power_law_1.01,0.17605119943618774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,32,power_law_1.2,1.2342016220092773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,16,power_law_1.01,0.18893439769744874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,32,power_law_1.2,1.6919296264648438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,16,power_law_1.01,0.1946943998336792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,32,power_law_1.2,1.928883171081543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,16,power_law_1.01,0.1903872013092041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,16,power_law_1.01,0.20308480262756348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,32,power_law_1.2,2.8844736099243162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,16,power_law_1.01,0.20103039741516113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,16,power_law_1.01,0.23422720432281494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,32,power_law_1.2,7.5778556823730465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,16,power_law_1.01,0.2575040102005005
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,16,power_law_1.01,0.306713604927063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,16,power_law_1.01,0.36570239067077637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,16,power_law_1.01,0.4883711814880371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,16,power_law_1.01,0.5772736072540283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,16,power_law_1.01,0.8924480438232422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,16,power_law_1.01,1.0683775901794434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,16,power_law_1.01,1.3079487800598144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,16,power_law_1.01,2.0305152893066407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,16,power_law_1.01,3.8986366271972654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,16,power_law_1.2,0.11237119436264038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,16,power_law_1.2,0.16622719764709473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,8,power_law_1.01,0.08363519906997681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,16,power_law_1.2,0.06976640224456787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,8,power_law_1.01,0.11312639713287354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,16,power_law_1.2,0.08104320168495179
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,8,power_law_1.01,0.07626879811286927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,16,power_law_1.2,0.09415040016174317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,8,power_law_1.01,0.07790719866752624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,16,power_law_1.2,0.10807679891586304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,16,power_law_1.2,0.13838080167770386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,8,power_law_1.01,0.09592959880828858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,16,power_law_1.2,0.14351999759674072
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,8,power_law_1.01,0.11210880279541016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,8,power_law_1.2,0.08652160167694092
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,16,power_law_1.2,0.14022400379180908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,8,power_law_1.01,0.1295040011405945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,8,power_law_1.2,0.11253759860992432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,16,power_law_1.2,0.14492160081863403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,8,power_law_1.01,0.13893760442733766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,8,power_law_1.2,0.06624640226364135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,16,power_law_1.2,0.15107840299606323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,8,power_law_1.01,0.14385279417037963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,8,power_law_1.2,0.0840448021888733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,16,power_law_1.2,0.15230720043182372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,8,power_law_1.01,0.14664959907531738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,16,power_law_1.2,0.16274559497833252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,8,power_law_1.2,0.09511680006980897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,8,power_law_1.01,0.14979840517044068
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,16,power_law_1.2,0.16889599561691285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,8,power_law_1.2,0.10802559852600098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,8,power_law_1.01,0.15286400318145751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,16,power_law_1.2,0.1842560052871704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,8,power_law_1.2,0.13089920282363893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,8,power_law_1.01,0.1652351975440979
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,16,power_law_1.2,0.20677759647369384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,8,power_law_1.2,0.1401792049407959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,8,power_law_1.01,0.17907840013504028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,16,power_law_1.2,0.1883455991744995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,8,power_law_1.2,0.14796160459518432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,8,power_law_1.01,0.18317439556121826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,16,power_law_1.2,0.21743359565734863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,8,power_law_1.2,0.1508095979690552
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,8,power_law_1.01,0.1876863956451416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,16,power_law_1.2,0.21008639335632323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,8,power_law_1.2,0.16188160181045533
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,8,power_law_1.01,0.19178240299224852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,8,power_law_1.2,0.156550395488739
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,16,power_law_1.2,0.25102078914642334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,8,power_law_1.01,0.20650880336761473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,8,power_law_1.2,0.16227840185165404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,16,power_law_1.2,0.2667840003967285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,4,power_law_1.01,0.06218879818916321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,8,power_law_1.01,0.2151103973388672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,8,power_law_1.2,0.18606719970703126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,4,power_law_1.01,0.08635519742965699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,16,power_law_1.2,0.35852799415588377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,8,power_law_1.01,0.24870400428771972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,8,power_law_1.2,0.1934272050857544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,4,power_law_1.01,0.07509120106697083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,16,power_law_1.2,0.41075839996337893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,8,power_law_1.01,0.26981120109558104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,8,power_law_1.2,0.1966976046562195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,4,power_law_1.01,0.07774720191955567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,16,power_law_1.2,0.5326208114624024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,8,power_law_1.01,0.32366080284118653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,8,power_law_1.2,0.19794559478759766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,4,power_law_1.01,0.0949504017829895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,16,power_law_1.2,0.6733248233795166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,8,power_law_1.01,0.40497918128967286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,8,power_law_1.2,0.22271358966827393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,4,power_law_1.01,0.11666560173034668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,16,power_law_1.2,1.1027839660644532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,8,power_law_1.01,0.49816322326660156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,8,power_law_1.2,0.2237312078475952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,4,power_law_1.01,0.13263360261917115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,16,power_law_1.2,1.246553611755371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,8,power_law_1.01,0.6148928165435791
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,4,power_law_1.01,0.14349440336227418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,8,power_law_1.2,0.2642751932144165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,8,power_law_1.01,0.8702783584594727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,16,power_law_1.2,1.5265088081359863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,4,power_law_1.01,0.14984960556030275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,8,power_law_1.2,0.28270080089569094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,8,power_law_1.01,1.0969792366027833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,16,power_law_1.2,2.484556770324707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,4,power_law_1.01,0.15045119524002076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,8,power_law_1.2,0.35151360034942625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,8,power_law_1.01,1.3112128257751465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,4,power_law_1.01,0.15803519487380982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,8,power_law_1.2,0.4055935859680176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,16,power_law_1.2,5.626816177368164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,4,power_law_1.01,0.15495680570602416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,8,power_law_1.01,1.9555072784423828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,8,power_law_1.2,0.5414976119995117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,4,power_law_1.01,0.16662399768829345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,8,power_law_1.2,0.6904640197753906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,8,power_law_1.01,4.197043228149414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,4,power_law_1.01,0.18424960374832153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,8,power_law_1.2,0.9525440216064454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,4,power_law_1.01,0.19325439929962157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,8,power_law_1.2,1.1842368125915528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,4,power_law_1.01,0.20677120685577394
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,8,power_law_1.2,1.6317312240600585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,4,power_law_1.01,0.20349440574645997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,4,power_law_1.01,0.23442559242248534
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,8,power_law_1.2,2.271808052062988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,4,power_law_1.01,0.24241280555725098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,8,power_law_1.2,4.388531112670899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,4,power_law_1.01,0.2868544101715088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,4,power_law_1.01,0.3144320011138916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,4,power_law_1.01,0.38863999843597413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,4,power_law_1.01,0.4522687911987305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,4,power_law_1.01,0.6026559829711914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,4,power_law_1.01,0.7441728115081787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,4,power_law_1.01,1.006719970703125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,4,power_law_1.01,1.2829695701599122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,4,power_law_1.01,1.5682751655578613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,4,power_law_1.01,2.3907007217407226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,4,power_law_1.01,5.073638534545898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,4,power_law_1.2,0.0630079984664917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,4,power_law_1.2,0.08677120208740234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,4,power_law_1.2,0.06382719874382019
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,4,power_law_1.2,0.07367039918899536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,4,power_law_1.2,0.09414399862289428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,4,power_law_1.2,0.10970879793167114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,4,power_law_1.2,0.135315203666687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,4,power_law_1.2,0.14206720590591432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,4,power_law_1.2,0.1424831986427307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,4,power_law_1.2,0.15230079889297485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,2,power_law_1.01,0.06254079937934875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,4,power_law_1.2,0.1572160005569458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,2,power_law_1.01,0.06930559873580933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,4,power_law_1.2,0.16663680076599122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,4,power_law_1.2,0.17114880084991455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,2,power_law_1.01,0.06602879762649536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,4,power_law_1.2,0.1903488039970398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,2,power_law_1.01,0.07709439992904663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,4,power_law_1.2,0.19941760301589967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,2,power_law_1.01,0.1002303957939148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,4,power_law_1.2,0.21251199245452881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,2,power_law_1.01,0.12030080556869507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,2,power_law_1.2,0.06439039707183838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,4,power_law_1.2,0.21251199245452881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,2,power_law_1.01,0.14753279685974122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,2,power_law_1.2,0.06970880031585694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,4,power_law_1.2,0.2350208044052124
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,2,power_law_1.01,0.15777920484542846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,2,power_law_1.2,0.06849920153617858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,4,power_law_1.2,0.24507520198822022
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,2,power_law_1.01,0.16188160181045533
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,2,power_law_1.2,0.08181120157241821
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,4,power_law_1.2,0.29361279010772706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,2,power_law_1.01,0.16474239826202391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,2,power_law_1.2,0.09861119985580444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,4,power_law_1.2,0.33025920391082764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,2,power_law_1.01,0.17702399492263793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,2,power_law_1.2,0.1213312029838562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,4,power_law_1.2,0.41239042282104493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,2,power_law_1.01,0.18235520124435425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,2,power_law_1.2,0.14878079891204835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,4,power_law_1.2,0.4941247940063477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,2,power_law_1.01,0.19219199419021607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,2,power_law_1.2,0.16024320125579833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,2,power_law_1.01,0.19996800422668456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,4,power_law_1.2,0.6376768112182617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,2,power_law_1.2,0.1645248055458069
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,2,power_law_1.01,0.21553919315338135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,4,power_law_1.2,0.8039744377136231
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,2,power_law_1.2,0.16803200244903566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,2,power_law_1.01,0.21901440620422363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,4,power_law_1.2,1.0452223777770997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,2,power_law_1.2,0.17909120321273803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,2,power_law_1.01,0.23130240440368652
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,4,power_law_1.2,1.553542423248291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,2,power_law_1.2,0.18625919818878173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,2,power_law_1.01,0.26467199325561525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,4,power_law_1.2,1.6473344802856444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,2,power_law_1.2,0.20366721153259276
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,2,power_law_1.01,0.3074879884719849
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,4,power_law_1.2,2.5877824783325196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,2,power_law_1.2,0.20899200439453125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,2,power_law_1.01,0.36708478927612304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,2,power_law_1.2,0.23172481060028077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,2,power_law_1.01,0.44040961265563966
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,4,power_law_1.2,5.674931335449219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,2,power_law_1.2,0.2347775936126709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,2,power_law_1.01,0.5571135997772216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,2,power_law_1.2,0.24012160301208496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,2,power_law_1.01,0.6222655773162842
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,2,power_law_1.2,0.2804608106613159
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,2,power_law_1.01,0.8338303565979004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,2,power_law_1.2,0.3173311948776245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,2,power_law_1.01,1.0504960060119628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,2,power_law_1.2,0.38265600204467776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,2,power_law_1.01,1.3873920440673828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,2,power_law_1.2,0.4367231845855713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,2,power_law_1.01,1.8406080245971679
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,2,power_law_1.2,0.5452608108520508
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,2,power_law_1.01,2.1279359817504884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,2,power_law_1.2,0.6360000133514404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,1,power_law_1.01,0.06218240261077881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,2,power_law_1.2,0.8403519630432129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,1,power_law_1.01,0.06588159799575806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,2,power_law_1.01,3.3090049743652346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,2,power_law_1.2,1.1019136428833007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,1,power_law_1.01,0.0767359972000122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,2,power_law_1.01,6.40417251586914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,1,power_law_1.01,0.09413759708404541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,2,power_law_1.2,1.4238656044006348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,1,power_law_1.01,0.12360960245132446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,2,power_law_1.2,2.0521728515625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,1,power_law_1.01,0.14615679979324342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,2,power_law_1.2,2.28851203918457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,1,power_law_1.01,0.1815808057785034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,2,power_law_1.2,3.5347263336181642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,1,power_law_1.01,0.19203200340270996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,1,power_law_1.01,0.19775359630584716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,2,power_law_1.2,6.877881622314453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,1,power_law_1.01,0.2075968027114868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,1,power_law_1.01,0.2211008071899414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,1,power_law_1.01,0.22376320362091065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,1,power_law_1.01,0.234604811668396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,1,power_law_1.01,0.25217280387878416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,1,power_law_1.01,0.2605695962905884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,1,power_law_1.01,0.27026560306549074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,1,power_law_1.01,0.2921663999557495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,1,power_law_1.01,0.35872640609741213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,32,power_law_1.01,0.06704639792442321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,1,power_law_1.01,0.40767998695373536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,32,power_law_1.01,0.05004799962043762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,1,power_law_1.01,0.5088255882263184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,32,power_law_1.01,0.044300800561904906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,1,power_law_1.01,0.5891583919525146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,32,power_law_1.01,0.049235200881958006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,1,power_law_1.01,0.7793856143951416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,32,power_law_1.01,0.05414400100708008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,32,power_law_1.01,0.05906559824943543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,1,power_law_1.01,0.9538751602172851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,32,power_law_1.01,0.06111360192298889
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,32,power_law_1.2,0.05783680081367493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,1,power_law_1.01,1.3186367988586425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,32,power_law_1.01,0.05865600109100342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,32,power_law_1.2,0.050860798358917235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,1,power_law_1.01,1.6432319641113282
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,32,power_law_1.01,0.05885440111160278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,32,power_law_1.2,0.04780800044536591
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,1,power_law_1.01,2.2586624145507814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,32,power_law_1.01,0.05926399827003479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,32,power_law_1.2,0.051910400390625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,32,power_law_1.01,0.05989120006561279
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,32,power_law_1.2,0.05457280278205871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,1,power_law_1.01,2.866374397277832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,32,power_law_1.01,0.06110079884529114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,32,power_law_1.2,0.0603007972240448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,1,power_law_1.01,3.5036479949951174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,32,power_law_1.01,0.061740797758102414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,32,power_law_1.2,0.061945599317550656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,32,power_law_1.2,0.06276479959487916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,32,power_law_1.01,0.06356480121612548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,1,power_law_1.01,5.361382293701172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,32,power_law_1.2,0.06644480228424073
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,32,power_law_1.2,0.06808320283889771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,1,power_law_1.01,10.395295715332031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,32,power_law_1.2,0.07464320063591004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,32,power_law_1.2,0.07545599937438965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,32,power_law_1.2,0.07505279779434204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,32,power_law_1.2,0.06562560200691223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,32,power_law_1.2,0.07416319847106934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,32,power_law_1.2,0.08053119778633118
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,32,power_law_1.2,0.08119680285453797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,32,power_law_1.2,0.09388800263404846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,32,power_law_1.2,0.09696000218391418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,1,power_law_1.2,0.06464639902114869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,32,power_law_1.2,0.12195199728012085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,1,power_law_1.2,0.06751360297203064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,32,power_law_1.2,0.14262399673461915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,1,power_law_1.2,0.0775488018989563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,32,power_law_1.2,0.20817279815673828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,1,power_law_1.2,0.08983680009841918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,32,power_law_1.2,0.23393280506134034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,32,power_law_1.2,0.41276798248291013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,1,power_law_1.2,0.1150272011756897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,32,power_law_1.2,0.4494272232055664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,1,power_law_1.2,0.13797119855880738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,32,power_law_1.2,0.884607982635498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,1,power_law_1.2,0.1801535964012146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,16,power_law_1.01,0.05644800066947937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,32,power_law_1.2,1.2776191711425782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,1,power_law_1.2,0.1891711950302124
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,16,power_law_1.01,0.04296320080757141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,16,power_law_1.01,0.042105600237846375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,1,power_law_1.2,0.1932736039161682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,32,power_law_1.2,1.2636927604675292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,16,power_law_1.01,0.046623998880386354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,1,power_law_1.2,0.2072000026702881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,32,power_law_1.2,2.5619264602661134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,16,power_law_1.01,0.047443199157714847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,1,power_law_1.2,0.2176448106765747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,16,power_law_1.01,0.054816001653671266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,32,power_law_1.2,4.972627258300781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,1,power_law_1.2,0.2256256103515625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,16,power_law_1.01,0.055641597509384154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,1,power_law_1.2,0.2362623929977417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,16,power_law_1.01,0.054816001653671266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,1,power_law_1.2,0.24960000514984132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,16,power_law_1.01,0.058911997079849246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,16,power_law_1.01,0.06198400259017944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,1,power_law_1.2,0.26594560146331786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,16,power_law_1.01,0.06341760158538819
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,1,power_law_1.2,0.2784640073776245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,16,power_law_1.01,0.06711040139198303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,1,power_law_1.2,0.306713604927063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,16,power_law_1.01,0.07141119837760926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,1,power_law_1.2,0.3687551975250244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,16,power_law_1.01,0.06586880087852479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,1,power_law_1.2,0.45848960876464845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,16,power_law_1.01,0.07037439942359924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,1,power_law_1.2,0.542848014831543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,16,power_law_1.01,0.07242879867553711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,1,power_law_1.2,0.6026559829711914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,16,power_law_1.01,0.08922880291938781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,16,power_law_1.01,0.09494400024414062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,1,power_law_1.2,0.789631986618042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,16,power_law_1.01,0.0847104012966156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,1,power_law_1.2,0.9727295875549317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,16,power_law_1.01,0.10436480045318604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,1,power_law_1.2,1.3350208282470704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,16,power_law_1.01,0.12117760181427002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,16,power_law_1.2,0.05804160237312317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,1,power_law_1.2,1.6616704940795899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,16,power_law_1.01,0.15434880256652833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,16,power_law_1.2,0.044736000895500186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,1,power_law_1.2,2.2742336273193358
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,16,power_law_1.01,0.1682752013206482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,16,power_law_1.2,0.04310399889945984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,16,power_law_1.01,0.23728640079498292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,1,power_law_1.2,2.895609664916992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,16,power_law_1.2,0.045561599731445315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,16,power_law_1.01,0.2741503953933716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,16,power_law_1.2,0.045561599731445315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,1,power_law_1.2,3.501171112060547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,16,power_law_1.01,0.3689791917800903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,16,power_law_1.2,0.055801600217819214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,1,power_law_1.2,5.359743881225586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,16,power_law_1.2,0.055801600217819214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,16,power_law_1.01,0.5285120010375977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,16,power_law_1.2,0.05782399773597717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,16,power_law_1.01,0.6202688217163086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,16,power_law_1.2,0.05846400260925293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,1,power_law_1.2,10.378572845458985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,16,power_law_1.01,0.996070384979248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,16,power_law_1.2,0.05989760160446167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,16,power_law_1.2,0.0615231990814209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,16,power_law_1.01,2.109164810180664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,16,power_law_1.2,0.06521599888801574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,16,power_law_1.2,0.06561920046806335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,16,power_law_1.2,0.06726400256156921
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,16,power_law_1.2,0.07258880138397217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,16,power_law_1.2,0.07832959890365601
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,16,power_law_1.2,0.09430400133132935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,16,power_law_1.2,0.10085120201110839
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,16,power_law_1.2,0.09348480105400085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,16,power_law_1.2,0.10986239910125732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,16,power_law_1.2,0.14056960344314576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,16,power_law_1.2,0.16802560091018676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,16,power_law_1.2,0.2069375991821289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,16,power_law_1.2,0.2618304014205933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,16,power_law_1.2,0.32673280239105223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,16,power_law_1.2,0.6046592235565186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,8,power_law_1.01,0.040479999780654904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,16,power_law_1.2,0.8850367546081543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,8,power_law_1.01,0.038841599225997926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,8,power_law_1.01,0.03761920034885406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,16,power_law_1.2,1.0279680252075196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,8,power_law_1.2,0.041280001401901245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,8,power_law_1.01,0.04622719883918762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,8,power_law_1.2,0.035980799794197084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,16,power_law_1.2,1.4447360038757324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,8,power_law_1.01,0.043750399351119997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,8,power_law_1.2,0.039852800965309146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,16,power_law_1.2,3.6836414337158203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,8,power_law_1.01,0.05562880039215088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,8,power_law_1.2,0.04334079921245575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,8,power_law_1.01,0.05644800066947937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,8,power_law_1.2,0.044563201069831845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,8,power_law_1.01,0.05809919834136963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,8,power_law_1.2,0.054816001653671266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,8,power_law_1.01,0.05809919834136963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,8,power_law_1.2,0.05707520246505737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,8,power_law_1.2,0.0605567991733551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,8,power_law_1.01,0.06096000075340271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,8,power_law_1.2,0.06158080101013184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,8,power_law_1.01,0.06506239771842956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,8,power_law_1.2,0.06251519918441772
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,8,power_law_1.01,0.06846719980239868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,8,power_law_1.2,0.06628479957580566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,8,power_law_1.01,0.06752640008926392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,8,power_law_1.2,0.07099519968032837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,8,power_law_1.01,0.0664896011352539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,8,power_law_1.2,0.07079039812088013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,8,power_law_1.01,0.07079039812088013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,8,power_law_1.2,0.06483200192451477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,8,power_law_1.01,0.07407360076904297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,8,power_law_1.2,0.0720255970954895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,8,power_law_1.01,0.08329600095748901
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,8,power_law_1.2,0.07447680234909057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,8,power_law_1.01,0.0896448016166687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,8,power_law_1.2,0.08082559704780579
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,8,power_law_1.01,0.09906560182571411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,8,power_law_1.2,0.09966080188751221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,8,power_law_1.01,0.10951039791107178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,8,power_law_1.2,0.10005760192871094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,8,power_law_1.01,0.12683520317077637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,8,power_law_1.2,0.11605119705200195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,8,power_law_1.01,0.1559999942779541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,8,power_law_1.2,0.1307904005050659
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,8,power_law_1.01,0.1850816011428833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,4,power_law_1.01,0.03712640106678009
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,8,power_law_1.2,0.17441920042037964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,8,power_law_1.01,0.23934719562530518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,4,power_law_1.01,0.037363201379776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,8,power_law_1.2,0.1952831983566284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,8,power_law_1.01,0.3327359914779663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,4,power_law_1.01,0.036959999799728395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,8,power_law_1.2,0.2870527982711792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,8,power_law_1.01,0.4238592147827148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,4,power_law_1.01,0.04207360148429871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,8,power_law_1.2,0.3773695945739746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,4,power_law_1.01,0.047814399003982544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,8,power_law_1.01,0.5322175979614258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,8,power_law_1.2,0.529747200012207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,4,power_law_1.01,0.05907840132713318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,8,power_law_1.01,0.6716800212860108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,4,power_law_1.01,0.061740797758102414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,8,power_law_1.2,0.6712512016296387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,8,power_law_1.01,0.9485440254211426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,4,power_law_1.01,0.06112639904022217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,8,power_law_1.2,0.8899840354919434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,4,power_law_1.01,0.06664959788322448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,8,power_law_1.01,1.996518325805664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,8,power_law_1.2,1.1474111557006836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,4,power_law_1.01,0.06644480228424073
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,4,power_law_1.01,0.06890239715576171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,8,power_law_1.2,2.5079103469848634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,4,power_law_1.01,0.07095040082931518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,4,power_law_1.01,0.07095040082931518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,4,power_law_1.01,0.07423359751701356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,4,power_law_1.01,0.08119040131568908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,4,power_law_1.01,0.08242560029029847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,4,power_law_1.01,0.09102720022201538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,4,power_law_1.01,0.10330239534378052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,4,power_law_1.01,0.11354880332946778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,4,power_law_1.01,0.14222079515457153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,4,power_law_1.01,0.15077120065689087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,4,power_law_1.01,0.18154239654541016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,4,power_law_1.01,0.22946560382843018
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,4,power_law_1.01,0.3371968030929565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,4,power_law_1.01,0.3750848054885864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,4,power_law_1.01,0.571065616607666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,4,power_law_1.01,0.7072127819061279
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,4,power_law_1.01,0.8649663925170898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,4,power_law_1.2,0.035155200958251955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,4,power_law_1.01,1.3243264198303222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,4,power_law_1.2,0.03312000036239624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,4,power_law_1.2,0.0355648010969162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,4,power_law_1.01,2.566431999206543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,4,power_law_1.2,0.0429504007101059
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,32,power_law_1.01,0.06807039976119995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,4,power_law_1.2,0.0486847996711731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,32,power_law_1.01,0.07462400197982788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,4,power_law_1.2,0.05727999806404114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,32,power_law_1.01,0.07709439992904663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,2,power_law_1.01,0.03617280125617981
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,4,power_law_1.2,0.058905601501464844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,32,power_law_1.01,0.0820032000541687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,2,power_law_1.01,0.03495039939880371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,4,power_law_1.2,0.06299520134925843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,32,power_law_1.01,0.08773120045661927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,2,power_law_1.01,0.04088320136070252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,4,power_law_1.2,0.06547200083732604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,32,power_law_1.01,0.11518720388412476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,2,power_law_1.01,0.04539520144462585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,4,power_law_1.2,0.06691200137138367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,32,power_law_1.01,0.13648639917373656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,2,power_law_1.01,0.05112959742546082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,4,power_law_1.2,0.06935679912567139
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,2,power_law_1.01,0.0677183985710144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,32,power_law_1.01,0.17068159580230713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,4,power_law_1.2,0.07345920205116271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,2,power_law_1.01,0.06913279891014099
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,32,power_law_1.01,0.19218560457229614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,4,power_law_1.2,0.07674239873886109
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,2,power_law_1.01,0.07038080096244811
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,32,power_law_1.01,0.2689919948577881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,4,power_law_1.2,0.070387202501297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,2,power_law_1.01,0.07119359970092773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,32,power_law_1.01,0.28024959564208984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,2,power_law_1.01,0.07263360023498536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,4,power_law_1.2,0.08061439990997314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,32,power_law_1.01,0.45554561614990235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,2,power_law_1.01,0.07693439722061157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,4,power_law_1.2,0.08492159843444824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,32,power_law_1.01,0.6267583847045899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,2,power_law_1.01,0.08060799837112427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,4,power_law_1.2,0.09107199907302857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,32,power_law_1.01,0.8166272163391113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,2,power_law_1.01,0.08062080144882203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,4,power_law_1.2,0.10234240293502808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,2,power_law_1.01,0.08513280153274536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,4,power_law_1.2,0.11175040006637574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,32,power_law_1.01,1.1436927795410157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,2,power_law_1.01,0.09843199849128723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,4,power_law_1.2,0.14083839654922486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,32,power_law_1.01,2.472217559814453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,2,power_law_1.01,0.1043776035308838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,4,power_law_1.2,0.15783679485321045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,2,power_law_1.01,0.10847359895706177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,4,power_law_1.2,0.20023679733276367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,2,power_law_1.01,0.12856320142745972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,4,power_law_1.2,0.26679680347442625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,2,power_law_1.2,0.03735679984092712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,2,power_law_1.01,0.14328320026397706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,4,power_law_1.2,0.34236159324646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,2,power_law_1.2,0.03695360124111176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,2,power_law_1.01,0.17863039970397948
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,2,power_law_1.2,0.0416703999042511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,4,power_law_1.2,0.4445504188537598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,2,power_law_1.01,0.21456639766693114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,2,power_law_1.2,0.043910399079322815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,4,power_law_1.2,0.6888703823089599
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,2,power_law_1.01,0.28603520393371584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,2,power_law_1.2,0.050886398553848265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,4,power_law_1.2,0.7580927848815918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,2,power_law_1.2,0.0689087986946106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,2,power_law_1.01,0.3290431976318359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,4,power_law_1.2,1.0034496307373046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,2,power_law_1.2,0.07300480008125305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,2,power_law_1.01,0.4420928001403809
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,4,power_law_1.2,1.613337516784668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,2,power_law_1.2,0.07464320063591004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,2,power_law_1.01,0.5388224124908447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,2,power_law_1.2,0.07462400197982788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,2,power_law_1.01,0.7937280178070069
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,4,power_law_1.2,3.3484031677246096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,2,power_law_1.2,0.07708160281181335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,2,power_law_1.01,1.0116288185119628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,2,power_law_1.2,0.07443199753761291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,2,power_law_1.01,1.1367615699768066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,2,power_law_1.2,0.0791487991809845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,2,power_law_1.2,0.0791487991809845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,2,power_law_1.01,1.8209983825683593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,2,power_law_1.2,0.08999680280685425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,2,power_law_1.01,3.3819839477539064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,2,power_law_1.2,0.09799039959907532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,2,power_law_1.2,0.10085760354995728
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,2,power_law_1.2,0.11272959709167481
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,2,power_law_1.2,0.13239680528640746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,2,power_law_1.2,0.1438655972480774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,2,power_law_1.2,0.18032000064849854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,2,power_law_1.2,0.22189440727233886
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,2,power_law_1.2,0.28142719268798827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,2,power_law_1.2,0.3623744010925293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,2,power_law_1.2,0.48833279609680175
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,2,power_law_1.2,0.5976960182189941
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,2,power_law_1.2,0.8629183769226074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,2,power_law_1.2,1.101433563232422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,2,power_law_1.2,1.290329647064209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,2,power_law_1.2,2.0644607543945312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,1,power_law_1.01,0.03715200126171112
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,1,power_law_1.01,0.03941119909286499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,2,power_law_1.2,3.7245697021484374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,1,power_law_1.01,0.0455487996339798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,1,power_law_1.01,0.051283198595047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,1,power_law_1.01,0.05578879714012146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,1,power_law_1.01,0.07831040024757385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,1,power_law_1.01,0.08094080090522766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,1,power_law_1.01,0.0820032000541687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,1,power_law_1.01,0.0840511977672577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,1,power_law_1.01,0.08528640270233154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,1,power_law_1.01,0.08937600255012512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,1,power_law_1.01,0.09448320269584656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,1,power_law_1.01,0.09715840220451355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,1,power_law_1.2,0.036185601353645326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,1,power_law_1.01,0.10863360166549682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,1,power_law_1.2,0.039263999462127684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,1,power_law_1.01,0.11619199514389038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,32,power_law_1.01,0.11441279649734497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,1,power_law_1.2,0.04252159893512726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,1,power_law_1.01,0.12194559574127198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,32,power_law_1.01,0.10088959932327271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,1,power_law_1.2,0.04888960123062134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,1,power_law_1.01,0.1340224027633667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,32,power_law_1.01,0.08533120155334473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,1,power_law_1.2,0.05687040090560913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,1,power_law_1.01,0.16187520027160646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,32,power_law_1.01,0.09310719966888428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,1,power_law_1.2,0.07612800002098083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,1,power_law_1.01,0.18992639780044557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,32,power_law_1.01,0.09578239917755127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,1,power_law_1.2,0.08104320168495179
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,1,power_law_1.01,0.24379520416259765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,32,power_law_1.01,0.11789439916610718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,1,power_law_1.2,0.08390399813652039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,1,power_law_1.01,0.29253759384155276
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,32,power_law_1.01,0.11544320583343506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,1,power_law_1.2,0.08554880023002624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,32,power_law_1.01,0.11829760074615478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,1,power_law_1.2,0.08758400082588196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,32,power_law_1.01,0.12178560495376586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,1,power_law_1.2,0.09086080193519593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,32,power_law_1.01,0.11972479820251465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,1,power_law_1.2,0.09598079919815064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,32,power_law_1.01,0.12853120565414428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,1,power_law_1.2,0.0980288028717041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,1,power_law_1.2,0.10724480152130127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,1,power_law_1.2,0.11831040382385254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,1,power_law_1.2,0.125273597240448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,1,power_law_1.2,0.13674240112304686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,32,power_law_1.2,0.14468480348587037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,1,power_law_1.2,0.16418559551239015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,32,power_law_1.2,0.08672000169754028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,1,power_law_1.2,0.19122560024261476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,32,power_law_1.2,0.08814719915390015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,1,power_law_1.2,0.2459007978439331
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,32,power_law_1.2,0.09921919703483581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,1,power_law_1.2,0.29443199634552003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,32,power_law_1.2,0.10638079643249512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,1,power_law_1.2,0.40482559204101565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,32,power_law_1.2,0.11723519563674926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,1,power_law_1.2,0.5186944007873535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,32,power_law_1.2,0.121343994140625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,32,power_law_1.2,0.11642240285873413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,1,power_law_1.2,0.6831552028656006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,32,power_law_1.2,0.12543359994888306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,1,power_law_1.2,0.8531135559082031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,32,power_law_1.2,0.12522239685058595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,1,power_law_1.2,1.1969920158386231
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,32,power_law_1.2,0.13279999494552613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,1,power_law_1.2,1.5371520042419433
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,32,power_law_1.2,0.13565440177917482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,1,power_law_1.2,1.9027263641357421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,32,power_law_1.2,0.1573632001876831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,32,power_law_1.2,0.16639360189437866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,1,power_law_1.2,2.9356735229492186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,32,power_law_1.2,0.17989120483398438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,1,power_law_1.2,5.654668807983398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,32,power_law_1.2,0.19137920141220094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,32,power_law_1.2,0.16843520402908324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,32,power_law_1.2,0.1872704029083252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,32,power_law_1.2,0.22577919960021972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,32,power_law_1.2,0.28743040561676025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,32,power_law_1.2,0.33064320087432864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,32,power_law_1.2,0.4850560188293457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,32,power_law_1.2,0.4981696128845215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,32,power_law_1.2,0.6417344093322754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,32,power_law_1.2,0.944422435760498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,32,power_law_1.2,1.418131160736084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,32,power_law_1.2,2.150079917907715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,32,power_law_1.2,2.757491111755371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,32,power_law_1.2,4.096640014648438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,32,power_law_1.2,9.925644683837891
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,16,power_law_1.01,0.11043839454650879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,16,power_law_1.01,0.11257599592208863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,16,power_law_1.01,0.06915839910507202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,16,power_law_1.01,0.08144639730453491
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,16,power_law_1.01,0.08922880291938781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,16,power_law_1.01,0.10560640096664428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,16,power_law_1.01,0.11066240072250366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,16,power_law_1.01,0.11708799600601197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,16,power_law_1.01,0.11871360540390015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,16,power_law_1.01,0.11953279972076417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,16,power_law_1.01,0.12444159984588624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,16,power_law_1.01,0.13304959535598754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,16,power_law_1.01,0.13299200534820557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,16,power_law_1.01,0.13961600065231322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,16,power_law_1.01,0.14718079566955566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,16,power_law_1.01,0.17564799785614013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,16,power_law_1.01,0.15660159587860106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,16,power_law_1.01,0.1801535964012146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,16,power_law_1.2,0.11294080018997192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,16,power_law_1.01,0.1863103985786438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,16,power_law_1.2,0.077920001745224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,16,power_law_1.01,0.22500479221343994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,16,power_law_1.2,0.07341439723968506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,16,power_law_1.01,0.24774401187896727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,16,power_law_1.2,0.08201599717140198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,16,power_law_1.2,0.08611199855804444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,16,power_law_1.01,0.31674880981445314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,16,power_law_1.2,0.1110975980758667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,16,power_law_1.01,0.3337536096572876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,16,power_law_1.2,0.11662720441818238
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,16,power_law_1.01,0.4773375988006592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,16,power_law_1.2,0.11989760398864746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,16,power_law_1.01,0.6243711948394776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,16,power_law_1.2,0.12502399682998658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,16,power_law_1.01,0.8535360336303711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,16,power_law_1.2,0.13157119750976562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,16,power_law_1.01,1.1437312126159669
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,16,power_law_1.2,0.13731199502944946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,16,power_law_1.01,1.4554368019104005
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,16,power_law_1.2,0.14099839925765992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,16,power_law_1.2,0.13813120126724243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,16,power_law_1.01,2.3522623062133787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,16,power_law_1.2,0.1397696018218994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,16,power_law_1.01,4.495091247558594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,16,power_law_1.2,0.14467840194702147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,16,power_law_1.2,0.1450943946838379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,16,power_law_1.2,0.1670207977294922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,16,power_law_1.2,0.20509440898895265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,16,power_law_1.2,0.21636478900909423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,16,power_law_1.2,0.264902400970459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,16,power_law_1.2,0.3132352113723755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,16,power_law_1.2,0.35050239562988283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,16,power_law_1.2,0.43466877937316895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,16,power_law_1.2,0.6618048191070557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,16,power_law_1.2,0.7142335891723632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,16,power_law_1.2,1.0949567794799804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,16,power_law_1.2,1.436563205718994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,16,power_law_1.2,1.8529151916503905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,16,power_law_1.2,3.24310417175293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,16,power_law_1.2,9.619961547851563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,8,power_law_1.01,0.08492799997329711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,8,power_law_1.01,0.0957759976387024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,8,power_law_1.01,0.06321280002593994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,8,power_law_1.01,0.07979519963264466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,8,power_law_1.01,0.09005439877510071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,8,power_law_1.01,0.10970879793167114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,8,power_law_1.01,0.11175680160522461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,8,power_law_1.01,0.11297919750213622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,8,power_law_1.01,0.12362879514694214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,8,power_law_1.01,0.11994240283966065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,8,power_law_1.01,0.13489919900894165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,8,power_law_1.01,0.13919999599456787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,8,power_law_1.01,0.14410879611968994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,1,power_law_1.01,0.40434560775756834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,8,power_law_1.01,0.136735999584198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,1,power_law_1.01,0.5006080150604248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,8,power_law_1.01,0.14043519496917725
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,1,power_law_1.01,0.6798079967498779
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,8,power_law_1.01,0.14123519659042358
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,1,power_law_1.01,0.851039981842041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,32,power_law_1.01,0.13214720487594606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,8,power_law_1.01,0.1520959973335266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,1,power_law_1.01,1.2018431663513183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,32,power_law_1.01,0.1469823956489563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,8,power_law_1.01,0.17136000394821166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,8,power_law_1.2,0.08918399810791015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,1,power_law_1.01,1.5416000366210938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,32,power_law_1.01,0.15595519542694092
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,8,power_law_1.01,0.18567680120468139
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,8,power_law_1.2,0.06439679861068726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,1,power_law_1.01,1.8948863983154296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,32,power_law_1.01,0.16725759506225585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,8,power_law_1.01,0.21783039569854737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,8,power_law_1.2,0.06725119948387145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,32,power_law_1.01,0.1690816044807434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,8,power_law_1.01,0.23136639595031738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,8,power_law_1.2,0.0803712010383606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,1,power_law_1.01,2.9188863754272463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,32,power_law_1.01,0.16171519756317138
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,8,power_law_1.01,0.2934015989303589
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,8,power_law_1.2,0.0844543993473053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,1,power_law_1.01,5.669760131835938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,32,power_law_1.01,0.18199039697647096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,8,power_law_1.2,0.11230720281600952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,8,power_law_1.01,0.3587519884109497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,32,power_law_1.01,0.20350079536437987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,8,power_law_1.2,0.11272959709167481
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,8,power_law_1.01,0.5014912128448487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,8,power_law_1.2,0.12091519832611083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,32,power_law_1.01,0.2551104068756104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,8,power_law_1.01,0.6018303871154785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,8,power_law_1.2,0.1254271984100342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,32,power_law_1.01,0.27784318923950196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,8,power_law_1.01,0.8326399803161622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,8,power_law_1.2,0.130348801612854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,32,power_law_1.01,0.3548352003097534
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,8,power_law_1.01,1.0720640182495118
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,8,power_law_1.2,0.1373247981071472
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,32,power_law_1.01,0.3906816005706787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,8,power_law_1.01,1.1256959915161133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,8,power_law_1.2,0.14365439414978026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,32,power_law_1.01,0.6161600112915039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,8,power_law_1.01,1.9408191680908202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,8,power_law_1.2,0.1532863974571228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,32,power_law_1.01,0.6909120082855225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,8,power_law_1.2,0.1371135950088501
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,32,power_law_1.01,0.9145664215087891
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,8,power_law_1.01,3.7704830169677734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,8,power_law_1.2,0.14665600061416625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,32,power_law_1.01,1.2576000213623046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,8,power_law_1.2,0.15326080322265626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,32,power_law_1.01,1.6837823867797852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,8,power_law_1.2,0.15779199600219726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,8,power_law_1.2,0.17418880462646485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,32,power_law_1.01,2.723155212402344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,8,power_law_1.2,0.19997440576553344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,8,power_law_1.2,0.24012160301208496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,32,power_law_1.01,5.737535858154297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,8,power_law_1.2,0.2614207983016968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,8,power_law_1.2,0.34415359497070314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,8,power_law_1.2,0.41459197998046876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,8,power_law_1.2,0.5178175926208496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,8,power_law_1.2,0.6251455783843994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,8,power_law_1.2,0.9153471946716308
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,8,power_law_1.2,1.4508928298950194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,8,power_law_1.2,1.4982080459594727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,8,power_law_1.2,2.3272384643554687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,8,power_law_1.2,5.697427368164062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,4,power_law_1.01,0.06480000019073487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,4,power_law_1.01,0.0713536024093628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,4,power_law_1.01,0.05988479852676391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,4,power_law_1.01,0.07544320225715637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,4,power_law_1.01,0.09142400026321411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,4,power_law_1.01,0.10862720012664795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,4,power_law_1.01,0.1188480019569397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,4,power_law_1.01,0.12132480144500732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,4,power_law_1.01,0.12378239631652832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,4,power_law_1.01,0.12910720109939575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,4,power_law_1.01,0.1356608033180237
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,4,power_law_1.2,0.06424319744110107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,4,power_law_1.01,0.1364799976348877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,4,power_law_1.2,0.058508801460266116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,4,power_law_1.2,0.06444799900054932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,4,power_law_1.2,0.07530239820480347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,4,power_law_1.2,0.08347520232200623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,4,power_law_1.2,0.11299200057983398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,4,power_law_1.2,0.11953920125961304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,4,power_law_1.2,0.125273597240448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,4,power_law_1.2,0.12936960458755492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,4,power_law_1.2,0.13059840202331544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,2,power_law_1.01,0.05679360032081604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,4,power_law_1.2,0.13755520582199096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,2,power_law_1.01,0.06259840130805969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,4,power_law_1.2,0.14042880535125732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,2,power_law_1.01,0.0646399974822998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,4,power_law_1.2,0.14124159812927245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,2,power_law_1.01,0.07837439775466919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,4,power_law_1.2,0.14780800342559813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,2,power_law_1.01,0.09413120150566101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,4,power_law_1.2,0.15476479530334472
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,2,power_law_1.01,0.12485120296478272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,4,power_law_1.2,0.1627392053604126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,2,power_law_1.01,0.13100160360336305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,4,power_law_1.2,0.16479359865188598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,2,power_law_1.01,0.13162239789962768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,4,power_law_1.2,0.1836351990699768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,2,power_law_1.01,0.13953280448913574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,4,power_law_1.2,0.2018752098083496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,2,power_law_1.01,0.13960959911346435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,4,power_law_1.2,0.2454848051071167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,2,power_law_1.01,0.14778239727020265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,2,power_law_1.2,0.05968639850616455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,4,power_law_1.2,0.29033598899841306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,2,power_law_1.01,0.15066239833831788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,2,power_law_1.2,0.061536002159118655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,4,power_law_1.2,0.3626368045806885
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,2,power_law_1.01,0.15084799528121948
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,2,power_law_1.2,0.06276479959487916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,2,power_law_1.01,0.16253440380096434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,4,power_law_1.2,0.4330751895904541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,2,power_law_1.2,0.07893760204315185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,2,power_law_1.01,0.1702911972999573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,2,power_law_1.2,0.0906175971031189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,4,power_law_1.2,0.5485824108123779
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,2,power_law_1.01,0.1859007954597473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,2,power_law_1.2,0.12337919473648071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,4,power_law_1.2,0.7707903861999512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,2,power_law_1.2,0.131167995929718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,2,power_law_1.01,0.19735679626464844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,4,power_law_1.2,1.0034624099731446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,2,power_law_1.2,0.13276159763336182
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,2,power_law_1.01,0.23461759090423584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,4,power_law_1.2,1.3927680015563966
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,2,power_law_1.2,0.13690240383148194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,2,power_law_1.01,0.25939838886260985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,4,power_law_1.2,1.6956800460815429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,2,power_law_1.2,0.14202239513397216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,2,power_law_1.01,0.30792319774627686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,4,power_law_1.2,2.4738943099975588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,2,power_law_1.2,0.14939520359039307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,2,power_law_1.01,0.36890881061553954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,2,power_law_1.2,0.1561344027519226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,2,power_law_1.01,0.4555967807769775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,4,power_law_1.2,6.768160247802735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,2,power_law_1.2,0.1565567970275879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,2,power_law_1.01,0.5850304126739502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,2,power_law_1.2,0.16391680240631104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,2,power_law_1.01,0.7449791908264161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,2,power_law_1.2,0.18399360179901122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,2,power_law_1.01,0.9469183921813965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,2,power_law_1.2,0.19404159784317015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,2,power_law_1.01,1.2559552192687988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,2,power_law_1.2,0.20774400234222412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,2,power_law_1.01,1.723103904724121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,2,power_law_1.2,0.24865920543670655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,2,power_law_1.2,0.26428799629211425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,2,power_law_1.01,2.1665088653564455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,2,power_law_1.2,0.31630721092224123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,2,power_law_1.01,3.0115072250366213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,2,power_law_1.2,0.3687295913696289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,2,power_law_1.2,0.4518847942352295
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,2,power_law_1.01,6.221535873413086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,2,power_law_1.2,0.5919680118560791
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,2,power_law_1.2,0.7587967872619629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,2,power_law_1.2,0.939027214050293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,2,power_law_1.2,1.363167953491211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,2,power_law_1.2,1.6993215560913086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,2,power_law_1.2,2.1173120498657227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,2,power_law_1.2,3.4229183197021484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,2,power_law_1.2,6.9567619323730465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,32,power_law_1.01,0.16270079612731933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,1,power_law_1.01,0.05440639853477478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,32,power_law_1.01,0.21163520812988282
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,1,power_law_1.01,0.061382400989532473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,1,power_law_1.01,0.0720192015171051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,32,power_law_1.01,0.23725440502166747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,1,power_law_1.01,0.09127680063247681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,32,power_law_1.01,0.10536320209503174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,1,power_law_1.01,0.10786559581756591
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,32,power_law_1.01,0.13198720216751098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,1,power_law_1.01,0.14800000190734863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,32,power_law_1.01,0.13935999870300292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,1,power_law_1.01,0.15516799688339233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,1,power_law_1.01,0.16028159856796265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,32,power_law_1.01,0.16391680240631104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,1,power_law_1.01,0.1662335991859436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,32,power_law_1.01,0.17417600154876708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,1,power_law_1.01,0.16705280542373657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,32,power_law_1.01,0.17110400199890136
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,1,power_law_1.2,0.05419520139694214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,1,power_law_1.01,0.17647360563278197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,1,power_law_1.2,0.06239359974861145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,1,power_law_1.01,0.18137600421905517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,32,power_law_1.01,0.18031359910964967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,1,power_law_1.2,0.07180799841880799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,1,power_law_1.01,0.19162240028381347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,32,power_law_1.01,0.17662719488143921
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,1,power_law_1.01,0.20309760570526122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,1,power_law_1.2,0.08388479948043823
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,32,power_law_1.01,0.19055360555648804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,1,power_law_1.01,0.21580159664154053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,1,power_law_1.2,0.10682879686355591
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,32,power_law_1.01,0.1987391948699951
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,1,power_law_1.01,0.23299839496612548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,1,power_law_1.2,0.1461632013320923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,32,power_law_1.01,0.20755200386047362
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,1,power_law_1.01,0.253273606300354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,1,power_law_1.2,0.15208319425582886
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,32,power_law_1.01,0.21042559146881104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,1,power_law_1.01,0.3124608039855957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,1,power_law_1.2,0.16459519863128663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,1,power_law_1.01,0.36366078853607176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,1,power_law_1.2,0.16560640335083007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,32,power_law_1.01,0.2061311960220337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,1,power_law_1.01,0.46462078094482423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,1,power_law_1.2,0.1693120002746582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,32,power_law_1.01,0.2243583917617798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,1,power_law_1.2,0.18404480218887329
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,1,power_law_1.01,0.5371071815490722
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,32,power_law_1.01,0.2378688097000122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,1,power_law_1.2,0.19529600143432618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,1,power_law_1.01,0.690118408203125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,32,power_law_1.01,0.24440960884094237
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,1,power_law_1.2,0.2006335973739624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,1,power_law_1.01,0.8760640144348144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,32,power_law_1.01,0.29910399913787844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,1,power_law_1.2,0.2073983907699585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,1,power_law_1.01,1.1461888313293458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,32,power_law_1.01,0.315065598487854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,1,power_law_1.2,0.2237760066986084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,1,power_law_1.01,1.3538559913635253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,32,power_law_1.01,0.3808000087738037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,1,power_law_1.2,0.23647360801696776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,1,power_law_1.01,1.888185691833496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,32,power_law_1.01,0.4473728179931641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,1,power_law_1.2,0.2561471939086914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,1,power_law_1.01,2.4575424194335938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,1,power_law_1.2,0.3210560083389282
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,32,power_law_1.01,0.5542719841003418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,1,power_law_1.01,3.0045440673828123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,1,power_law_1.2,0.3685375928878784
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,32,power_law_1.01,0.7166912078857421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,1,power_law_1.01,4.578636932373047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,1,power_law_1.2,0.4724031925201416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,32,power_law_1.01,0.925267219543457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,1,power_law_1.2,0.5403647899627686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,1,power_law_1.01,8.926547241210937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,32,power_law_1.01,1.1850687980651855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,1,power_law_1.2,0.6998655796051025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,1,power_law_1.2,0.8760640144348144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,32,power_law_1.01,1.4977791786193848
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,1,power_law_1.2,1.149459171295166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,32,power_law_1.01,2.169728088378906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,1,power_law_1.2,1.3644415855407714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,1,power_law_1.2,1.888185691833496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,32,power_law_1.01,4.3918720245361325
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,4,power_law_1.01,0.14814720153808594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,1,power_law_1.2,2.4243392944335938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,4,power_law_1.01,0.13935359716415405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,1,power_law_1.2,2.963999938964844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,4,power_law_1.01,0.14629759788513183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,4,power_law_1.01,0.1545024037361145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,1,power_law_1.2,4.580160140991211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,4,power_law_1.01,0.16596479415893556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,4,power_law_1.01,0.18358399868011474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,1,power_law_1.2,8.90155487060547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,4,power_law_1.01,0.20447359085083008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,4,power_law_1.01,0.23560960292816163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,4,power_law_1.01,0.276147198677063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,4,power_law_1.01,0.34639999866485593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,4,power_law_1.01,0.42381439208984373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,4,power_law_1.01,0.5391295909881592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,4,power_law_1.01,0.6769536018371582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,4,power_law_1.01,0.9263936042785644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,4,power_law_1.01,1.2137215614318848
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,4,power_law_1.01,1.5378560066223144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,4,power_law_1.01,2.316089630126953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,4,power_law_1.01,4.831059265136719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,32,power_law_1.2,0.1588544011116028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,32,power_law_1.2,0.2155071973800659
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,32,power_law_1.2,0.1551743984222412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,32,power_law_1.2,0.1017151951789856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,32,power_law_1.2,0.10784640312194824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,32,power_law_1.2,0.1438976049423218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,16,power_law_1.01,0.11406079530715943
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,32,power_law_1.2,0.14206080436706542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,16,power_law_1.01,0.16844160556793214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,32,power_law_1.2,0.1699136018753052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,16,power_law_1.01,0.2413503885269165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,32,power_law_1.2,0.16459519863128663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,16,power_law_1.01,0.08201599717140198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,32,power_law_1.2,0.18084479570388795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,16,power_law_1.01,0.09921919703483581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,16,power_law_1.2,0.11052800416946411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,32,power_law_1.2,0.1832128047943115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,16,power_law_1.01,0.13485440015792846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,16,power_law_1.2,0.1678655982017517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,32,power_law_1.2,0.19224319458007813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,16,power_law_1.01,0.1438655972480774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,16,power_law_1.2,0.17604479789733887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,32,power_law_1.2,0.17995519638061525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,16,power_law_1.01,0.1631168007850647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,16,power_law_1.2,0.08554239869117737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,32,power_law_1.2,0.20412158966064453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,16,power_law_1.01,0.17249280214309692
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,16,power_law_1.2,0.09741439819335937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,32,power_law_1.2,0.2006592035293579
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,16,power_law_1.01,0.17723519802093507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,16,power_law_1.2,0.11706240177154541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,32,power_law_1.2,0.20780799388885499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,16,power_law_1.01,0.17990399599075318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,16,power_law_1.2,0.12670079469680787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,32,power_law_1.2,0.21987199783325195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,16,power_law_1.01,0.18544000387191772
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,16,power_law_1.2,0.1643839955329895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,32,power_law_1.2,0.24324479103088378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,16,power_law_1.01,0.19178880453109742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,32,power_law_1.2,0.25347840785980225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,16,power_law_1.2,0.16725120544433594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,16,power_law_1.01,0.1880959987640381
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,32,power_law_1.2,0.3155200004577637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,16,power_law_1.01,0.20796799659729004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,16,power_law_1.2,0.16582399606704712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,32,power_law_1.2,0.35669119358062745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,16,power_law_1.01,0.21431679725646974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,16,power_law_1.2,0.1756351947784424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,8,power_law_1.01,0.08486400246620178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,32,power_law_1.2,0.44863362312316896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,16,power_law_1.01,0.21103360652923583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,16,power_law_1.2,0.18096640110015869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,8,power_law_1.01,0.1123136043548584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,32,power_law_1.2,0.5211520195007324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,16,power_law_1.01,0.22680959701538086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,16,power_law_1.2,0.18833279609680176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,8,power_law_1.01,0.17129600048065186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,16,power_law_1.01,0.25137920379638673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,32,power_law_1.2,0.7105984210968017
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,16,power_law_1.2,0.19018880128860474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,8,power_law_1.01,0.07667840123176575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,16,power_law_1.01,0.27083520889282225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,32,power_law_1.2,0.8502655982971191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,16,power_law_1.2,0.20369279384613037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,8,power_law_1.01,0.09409279823303222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,16,power_law_1.01,0.30237441062927245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,16,power_law_1.2,0.21454079151153566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,32,power_law_1.2,1.1232704162597655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,8,power_law_1.01,0.12624640464782716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,16,power_law_1.01,0.35255680084228513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,16,power_law_1.2,0.21495680809020995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,8,power_law_1.01,0.14262399673461915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,32,power_law_1.2,1.5567999839782716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,16,power_law_1.2,0.23215999603271484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,16,power_law_1.01,0.39697918891906736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,8,power_law_1.01,0.15851520299911498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,32,power_law_1.2,1.7403135299682617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,16,power_law_1.2,0.25141119956970215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,16,power_law_1.01,0.5071616172790527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,8,power_law_1.01,0.1786687970161438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,32,power_law_1.2,2.986528015136719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,16,power_law_1.2,0.30140159130096433
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,8,power_law_1.01,0.17210880517959595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,16,power_law_1.01,0.6304448127746582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,32,power_law_1.2,6.4906494140625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,16,power_law_1.2,0.33293440341949465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,8,power_law_1.01,0.1840000033378601
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,16,power_law_1.01,0.9165311813354492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,8,power_law_1.01,0.1876863956451416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,16,power_law_1.2,0.41893758773803713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,16,power_law_1.01,1.0810111999511718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,8,power_law_1.01,0.18890880346298217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,16,power_law_1.2,0.46460800170898436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,16,power_law_1.01,1.391487979888916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,8,power_law_1.01,0.19137279987335204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,16,power_law_1.2,0.6067391872406006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,16,power_law_1.01,2.160313606262207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,8,power_law_1.01,0.21286399364471437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,16,power_law_1.2,0.717139196395874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,16,power_law_1.01,4.235961532592773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,8,power_law_1.01,0.22086400985717775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,16,power_law_1.2,0.9469120025634765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,8,power_law_1.01,0.23620479106903075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,16,power_law_1.2,1.3153471946716309
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,8,power_law_1.01,0.24830079078674316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,16,power_law_1.2,1.8082496643066406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,8,power_law_1.01,0.26119680404663087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,16,power_law_1.2,2.492742347717285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,8,power_law_1.01,0.30543999671936034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,8,power_law_1.01,0.30339200496673585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,16,power_law_1.2,5.310995101928711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,8,power_law_1.01,0.37405440807342527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,8,power_law_1.01,0.43752322196960447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,8,power_law_1.01,0.529695987701416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,8,power_law_1.01,0.7236415863037109
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,8,power_law_1.01,0.9345215797424317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,8,power_law_1.01,1.1649855613708495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,8,power_law_1.01,1.4168831825256347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,8,power_law_1.01,2.1736896514892576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,8,power_law_1.01,3.897836685180664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,8,power_law_1.2,0.0834879994392395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,8,power_law_1.2,0.11175040006637574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,8,power_law_1.2,0.0998848021030426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,8,power_law_1.2,0.07530239820480347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,8,power_law_1.2,0.08799999952316284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,8,power_law_1.2,0.11504000425338745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,8,power_law_1.2,0.13101439476013182
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,8,power_law_1.2,0.15967999696731566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,8,power_law_1.2,0.1643839955329895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,8,power_law_1.2,0.17011840343475343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,4,power_law_1.01,0.06644480228424073
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,8,power_law_1.2,0.18098560571670533
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,4,power_law_1.01,0.08897280097007751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,8,power_law_1.2,0.17524479627609252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,4,power_law_1.01,0.12010879516601562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,8,power_law_1.2,0.19040640592575073
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,4,power_law_1.01,0.07525759935379028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,8,power_law_1.2,0.18855680227279664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,4,power_law_1.01,0.10003199577331542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,8,power_law_1.2,0.19693440198898315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,4,power_law_1.01,0.12665599584579468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,4,power_law_1.2,0.0646399974822998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,8,power_law_1.2,0.20492799282073976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,4,power_law_1.01,0.14550399780273438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,4,power_law_1.2,0.08758400082588196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,8,power_law_1.2,0.23054080009460448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,4,power_law_1.01,0.167193603515625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,4,power_law_1.2,0.08512639999389648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,8,power_law_1.2,0.24651520252227782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,4,power_law_1.01,0.16966400146484376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,4,power_law_1.2,0.07489280104637146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,8,power_law_1.2,0.2739583969116211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,4,power_law_1.01,0.18481919765472413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,4,power_law_1.2,0.10069119930267334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,8,power_law_1.2,0.30732159614562987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,4,power_law_1.01,0.1958847999572754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,4,power_law_1.2,0.11420799493789673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,8,power_law_1.2,0.32330880165100095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,4,power_law_1.01,0.2048896074295044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,4,power_law_1.2,0.1320255994796753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,8,power_law_1.2,0.40460801124572754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,4,power_law_1.01,0.19955840110778808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,8,power_law_1.2,0.47854080200195315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,4,power_law_1.2,0.15762560367584227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,4,power_law_1.01,0.21226239204406738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,8,power_law_1.2,0.578495979309082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,4,power_law_1.2,0.17155840396881103
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,4,power_law_1.01,0.22680959701538086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,4,power_law_1.01,0.23274240493774415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,4,power_law_1.2,0.17237759828567506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,8,power_law_1.2,0.7249343872070313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,4,power_law_1.01,0.24790399074554442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,4,power_law_1.2,0.1883455991744995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,8,power_law_1.2,1.0095935821533204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,4,power_law_1.01,0.26572160720825194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,4,power_law_1.2,0.18833279609680176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,8,power_law_1.2,1.283347225189209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,4,power_law_1.01,0.289683198928833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,4,power_law_1.2,0.20594561100006104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,8,power_law_1.2,1.6887168884277344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,4,power_law_1.01,0.34946560859680176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,4,power_law_1.2,0.20799999237060546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,8,power_law_1.2,2.506278419494629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,4,power_law_1.01,0.3691456079483032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,4,power_law_1.2,0.2219264030456543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,2,power_law_1.01,0.06561279892921448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,4,power_law_1.01,0.442464017868042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,4,power_law_1.2,0.23011200428009032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,8,power_law_1.2,4.988479995727539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,2,power_law_1.01,0.06971520185470581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,4,power_law_1.01,0.5276415824890137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,4,power_law_1.2,0.24917120933532716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,2,power_law_1.01,0.09347839951515198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,4,power_law_1.01,0.6708159923553467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,4,power_law_1.2,0.27394559383392336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,2,power_law_1.01,0.08282880187034607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,4,power_law_1.01,0.8219455718994141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,4,power_law_1.2,0.3058880090713501
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,2,power_law_1.01,0.1092352032661438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,4,power_law_1.01,1.1109312057495118
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,4,power_law_1.2,0.3554368019104004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,2,power_law_1.01,0.13566720485687256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,4,power_law_1.2,0.3745151996612549
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,2,power_law_1.01,0.15040639638900757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,4,power_law_1.01,1.452518367767334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,4,power_law_1.2,0.4646143913269043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,2,power_law_1.01,0.18091520071029663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,4,power_law_1.01,1.7181440353393556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,2,power_law_1.01,0.19054720401763917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,4,power_law_1.2,0.5534912109375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,4,power_law_1.01,2.5697023391723635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,2,power_law_1.01,0.19339519739151
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,4,power_law_1.2,0.7027904033660889
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,4,power_law_1.01,5.1202880859375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,2,power_law_1.01,0.20999679565429688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,4,power_law_1.2,0.8772095680236817
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,2,power_law_1.01,0.2165247917175293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,4,power_law_1.2,1.1654272079467773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,2,power_law_1.01,0.22577280998229982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,4,power_law_1.2,1.4826815605163575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,2,power_law_1.01,0.22802560329437255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,4,power_law_1.2,1.9039552688598633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,2,power_law_1.01,0.24563839435577392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,4,power_law_1.2,2.8734720230102537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,2,power_law_1.01,0.25566720962524414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,2,power_law_1.01,0.2702080011367798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,4,power_law_1.2,5.650956726074218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,2,power_law_1.01,0.30831360816955566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,2,power_law_1.01,0.3474112033843994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,2,power_law_1.01,0.4096127986907959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,2,power_law_1.01,0.48504958152770994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,2,power_law_1.01,0.6053247928619385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,2,power_law_1.01,0.7289663791656494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,2,power_law_1.01,0.9304767608642578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,2,power_law_1.01,1.1752256393432616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,2,power_law_1.01,1.5259648323059083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,2,power_law_1.01,1.9477247238159179
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,2,power_law_1.01,2.396447944641113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,2,power_law_1.01,3.619308853149414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,2,power_law_1.01,6.882323455810547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,2,power_law_1.2,0.06178560256958008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,2,power_law_1.2,0.0695680022239685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,2,power_law_1.2,0.07816320061683654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,2,power_law_1.2,0.08103039860725403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,2,power_law_1.2,0.09905279874801635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,2,power_law_1.2,0.12977919578552247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,2,power_law_1.2,0.14226560592651366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,8,power_law_1.01,0.03816959857940674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,2,power_law_1.2,0.17686400413513184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,8,power_law_1.01,0.03776000142097473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,8,power_law_1.01,0.03694080114364624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,2,power_law_1.2,0.18261760473251343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,8,power_law_1.01,0.03653759956359863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,2,power_law_1.2,0.18507519960403443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,8,power_law_1.01,0.03653759956359863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,8,power_law_1.01,0.039212799072265624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,2,power_law_1.2,0.20677120685577394
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,8,power_law_1.01,0.03939839899539947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,2,power_law_1.2,0.21127040386199952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,8,power_law_1.01,0.03941119909286499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,8,power_law_1.01,0.040627199411392215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,2,power_law_1.2,0.218451189994812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,8,power_law_1.01,0.04227199852466583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,2,power_law_1.2,0.23176960945129393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,8,power_law_1.01,0.04083200097084046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,8,power_law_1.01,0.045747199654579164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,2,power_law_1.2,0.25245440006256104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,8,power_law_1.01,0.04718720018863678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,2,power_law_1.2,0.25143680572509763
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,8,power_law_1.01,0.0488319993019104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,8,power_law_1.01,0.05681279897689819
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,2,power_law_1.2,0.2796992063522339
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,8,power_law_1.01,0.06275200247764587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,2,power_law_1.2,0.31409919261932373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,8,power_law_1.01,0.06438400149345398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,8,power_law_1.01,0.07623680233955384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,2,power_law_1.2,0.36296958923339845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,8,power_law_1.01,0.08732799887657165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,2,power_law_1.2,0.44332160949707033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,8,power_law_1.01,0.1172287940979004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,2,power_law_1.2,0.5039423942565918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,8,power_law_1.01,0.14364160299301149
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,8,power_law_1.01,0.19239039421081544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,2,power_law_1.2,0.6202752113342285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,8,power_law_1.01,0.20979840755462648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,2,power_law_1.2,0.7351679801940918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,8,power_law_1.01,0.32899200916290283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,8,power_law_1.01,0.4020927906036377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,2,power_law_1.2,0.9608575820922851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,1,power_law_1.01,0.0689087986946106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,8,power_law_1.01,0.5985023975372314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,2,power_law_1.2,1.2707072257995606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,1,power_law_1.01,0.07279999852180481
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,8,power_law_1.01,0.8387328147888183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,8,power_law_1.01,1.045580768585205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,1,power_law_1.01,0.0785152018070221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,2,power_law_1.2,1.6534847259521483
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,8,power_law_1.01,1.6775936126708983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,1,power_law_1.01,0.09737600088119507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,2,power_law_1.2,1.955571174621582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,8,power_law_1.01,3.522457504272461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,1,power_law_1.01,0.13073920011520385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,2,power_law_1.2,2.5075136184692384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,1,power_law_1.01,0.1643455982208252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,2,power_law_1.2,3.760243225097656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,1,power_law_1.01,0.1913472056388855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,1,power_law_1.2,0.06749439835548401
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,1,power_law_1.01,0.23152000904083253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,2,power_law_1.2,7.021907043457031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,1,power_law_1.2,0.06894720196723939
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,1,power_law_1.01,0.23478400707244873
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,1,power_law_1.2,0.07938560247421264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,1,power_law_1.01,0.2435839891433716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,1,power_law_1.2,0.09331200122833253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,1,power_law_1.01,0.2628544092178345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,1,power_law_1.2,0.11954560279846191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,1,power_law_1.01,0.2718463897705078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,8,power_law_1.2,0.03858560025691986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,1,power_law_1.2,0.1510655999183655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,1,power_law_1.01,0.28291199207305906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,8,power_law_1.2,0.037145599722862244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,1,power_law_1.2,0.16867200136184693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,8,power_law_1.2,0.037555199861526486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,1,power_law_1.01,0.29499518871307373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,8,power_law_1.2,0.037350401282310486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,1,power_law_1.2,0.21722240447998048
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,1,power_law_1.01,0.3064703941345215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,8,power_law_1.2,0.03653120100498199
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,1,power_law_1.2,0.22663679122924804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,8,power_law_1.2,0.03758080005645752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,1,power_law_1.01,0.32264320850372313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,4,power_law_1.01,0.042534399032592776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,8,power_law_1.2,0.03900800049304962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,1,power_law_1.01,0.35413761138916017
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,4,power_law_1.01,0.03495680093765259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,1,power_law_1.2,0.23564159870147705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,8,power_law_1.2,0.037363201379776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,4,power_law_1.01,0.03576320111751556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,1,power_law_1.01,0.42401919364929197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,1,power_law_1.2,0.2542912006378174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,8,power_law_1.2,0.03899520039558411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,4,power_law_1.01,0.036800000071525577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,8,power_law_1.2,0.03982079923152924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,1,power_law_1.01,0.4735743999481201
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,4,power_law_1.01,0.037011200189590455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,1,power_law_1.2,0.26698880195617675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,8,power_law_1.2,0.04062080085277557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,4,power_law_1.01,0.03781760036945343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,1,power_law_1.01,0.5870528221130371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,1,power_law_1.2,0.27681920528411863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,8,power_law_1.2,0.04759039878845215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,4,power_law_1.01,0.03783040046691895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,8,power_law_1.2,0.048825600743293764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,1,power_law_1.01,0.6724544048309327
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,4,power_law_1.01,0.038431999087333676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,1,power_law_1.2,0.29093759059906005
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,8,power_law_1.2,0.05025280117988586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,4,power_law_1.01,0.041484799981117246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,1,power_law_1.01,0.8706879615783691
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,1,power_law_1.2,0.3136768102645874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,8,power_law_1.2,0.056601601839065555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,4,power_law_1.01,0.04294399917125702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,8,power_law_1.2,0.06234239935874939
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,1,power_law_1.01,1.1162431716918946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,4,power_law_1.01,0.04376319944858551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,1,power_law_1.2,0.3251456022262573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,8,power_law_1.2,0.06602879762649536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,4,power_law_1.01,0.04455040097236633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,1,power_law_1.2,0.3591487884521484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,1,power_law_1.01,1.443507194519043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,8,power_law_1.2,0.07873280048370361
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,4,power_law_1.01,0.047865599393844604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,8,power_law_1.2,0.09040639996528625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,4,power_law_1.01,0.04540160000324249
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,1,power_law_1.2,0.4257023811340332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,1,power_law_1.01,1.886502456665039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,8,power_law_1.2,0.11558400392532349
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,4,power_law_1.01,0.055852800607681274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,1,power_law_1.2,0.47813758850097654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,1,power_law_1.01,2.524448013305664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,4,power_law_1.01,0.05624960064888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,8,power_law_1.2,0.14160640239715577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,4,power_law_1.01,0.06240000128746033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,1,power_law_1.2,0.5993216037750244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,8,power_law_1.2,0.19956480264663695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,1,power_law_1.01,3.103615951538086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,4,power_law_1.01,0.070387202501297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,8,power_law_1.2,0.24174718856811522
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,1,power_law_1.2,0.6909120082855225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,4,power_law_1.01,0.08144639730453491
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,8,power_law_1.2,0.3529599905014038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,1,power_law_1.01,3.7503807067871096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,1,power_law_1.2,0.8911999702453614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,4,power_law_1.01,0.10520319938659668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,8,power_law_1.2,0.41685757637023924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,4,power_law_1.01,0.1144063949584961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,1,power_law_1.01,5.766252899169922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,8,power_law_1.2,0.6136576175689697
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,1,power_law_1.2,1.1212032318115235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,4,power_law_1.01,0.15886080265045166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,8,power_law_1.2,0.8391360282897949
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,4,power_law_1.01,0.1938752055168152
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,1,power_law_1.2,1.451743984222412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,8,power_law_1.2,1.0596991539001466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,1,power_law_1.01,11.038182067871094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,4,power_law_1.01,0.2989376068115234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,8,power_law_1.2,1.6263935089111328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,1,power_law_1.2,1.9133695602416991
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,4,power_law_1.01,0.34973440170288084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,8,power_law_1.2,3.4892288208007813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,4,power_law_1.01,0.4985919952392578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,1,power_law_1.2,2.551321601867676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,4,power_law_1.01,0.777350378036499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,1,power_law_1.2,3.0987455368041994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,4,power_law_1.01,0.8752384185791016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,4,power_law_1.01,1.338310432434082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,1,power_law_1.2,3.765574264526367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,4,power_law_1.01,2.9183359146118164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,1,power_law_1.2,5.7768512725830075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,1,power_law_1.2,11.023481750488282
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,4,power_law_1.2,0.03675520122051239
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,4,power_law_1.2,0.04044159948825836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,4,power_law_1.2,0.036959999799728395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,4,power_law_1.2,0.03695360124111176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,2,power_law_1.01,0.0344895988702774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,4,power_law_1.2,0.036959999799728395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,2,power_law_1.01,0.035718399286270144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,4,power_law_1.2,0.0385919988155365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,2,power_law_1.01,0.035724800825119016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,4,power_law_1.2,0.0385919988155365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,2,power_law_1.01,0.03653759956359863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,4,power_law_1.2,0.038387200236320494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,2,power_law_1.01,0.03695360124111176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,2,power_law_1.2,0.033523198962211606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,4,power_law_1.2,0.03860479891300202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,2,power_law_1.01,0.03797119855880737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,2,power_law_1.2,0.03475199937820435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,4,power_law_1.2,0.04042240083217621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,2,power_law_1.01,0.03816959857940674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,2,power_law_1.2,0.03351680040359497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,4,power_law_1.2,0.04454399943351746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,2,power_law_1.01,0.03901439905166626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,2,power_law_1.2,0.03598720133304596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,4,power_law_1.2,0.04534400105476379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,2,power_law_1.01,0.040633600950241086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,2,power_law_1.2,0.03720319867134094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,4,power_law_1.2,0.04883840084075928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,1,power_law_1.01,0.03309440016746521
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,2,power_law_1.01,0.041043201088905336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,4,power_law_1.2,0.047193598747253415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,1,power_law_1.01,0.03310079872608185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,2,power_law_1.01,0.039603200554847715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,4,power_law_1.2,0.056409597396850586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,2,power_law_1.01,0.04226559996604919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,4,power_law_1.2,0.05743359923362732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,2,power_law_1.01,0.043507200479507444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,4,power_law_1.2,0.06439039707183838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,4,power_law_1.2,0.0744383990764618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,4,power_law_1.2,0.0834496021270752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,4,power_law_1.2,0.11272959709167481
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,4,power_law_1.2,0.12503039836883545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,4,power_law_1.2,0.16965759992599488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,4,power_law_1.2,0.22045440673828126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,4,power_law_1.2,0.2517888069152832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,4,power_law_1.2,0.3388351917266846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,4,power_law_1.2,0.5071807861328125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,4,power_law_1.2,0.8521920204162597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,4,power_law_1.2,0.9309056282043457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,4,power_law_1.2,1.3120384216308594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,4,power_law_1.2,3.0064767837524413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,1,power_law_1.2,0.03490560054779053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,1,power_law_1.2,0.03573119938373566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,1,power_law_1.2,0.03552640080451965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,1,power_law_1.2,0.039417600631713866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,1,power_law_1.2,0.03982079923152924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,1,power_law_1.2,0.04103040099143982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,1,power_law_1.2,0.04105600118637085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,1,power_law_1.2,0.04105600118637085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,1,power_law_1.2,0.043507200479507444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,1,power_law_1.2,0.043507200479507444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,1,power_law_1.2,0.04392319917678833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,1,power_law_1.2,0.04513919949531555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,1,power_law_1.2,0.0463808000087738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,1,power_law_1.2,0.04965760111808777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,1,power_law_1.2,0.05824000239372253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,1,power_law_1.2,0.06152960062026978
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,1,power_law_1.2,0.05989760160446167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,1,power_law_1.2,0.07381759881973267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,1,power_law_1.2,0.08528640270233154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,1,power_law_1.2,0.10412160158157349
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,1,power_law_1.2,0.11960959434509277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,1,power_law_1.2,0.15983999967575074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,1,power_law_1.2,0.18481279611587526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,1,power_law_1.2,0.25785601139068604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,1,power_law_1.2,0.3244927883148193
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,1,power_law_1.2,0.4662208080291748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,1,power_law_1.2,0.598521614074707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,1,power_law_1.2,0.7375936031341552
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,1,power_law_1.2,1.1740032196044923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,1,power_law_1.2,2.3518144607543947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,8,power_law_1.01,0.04325119853019714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,8,power_law_1.01,0.04103679955005646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,8,power_law_1.01,0.04023680090904236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,8,power_law_1.01,0.04226559996604919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,8,power_law_1.01,0.04105600118637085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,8,power_law_1.01,0.04264320135116577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,8,power_law_1.01,0.0433023989200592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,8,power_law_1.01,0.04310399889945984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,8,power_law_1.01,0.048019200563430786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,8,power_law_1.01,0.04924800097942352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,8,power_law_1.01,0.04924800097942352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,8,power_law_1.01,0.05621119737625122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,8,power_law_1.01,0.05621119737625122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,8,power_law_1.01,0.06439679861068726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,8,power_law_1.01,0.07587199807167053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,8,power_law_1.01,0.08201599717140198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,8,power_law_1.01,0.08734080195426941
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,8,power_law_1.01,0.10824320316314698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,8,power_law_1.01,0.1201024055480957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,8,power_law_1.01,0.16966400146484376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,8,power_law_1.01,0.17909120321273803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,8,power_law_1.01,0.25793919563293455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,8,power_law_1.01,0.3142528057098389
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,8,power_law_1.01,0.49939842224121095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,8,power_law_1.01,0.609984016418457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,8,power_law_1.01,0.906719970703125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,8,power_law_1.01,1.3021504402160644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,8,power_law_1.01,1.5039551734924317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,8,power_law_1.01,2.4677248001098633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,8,power_law_1.01,4.951948928833008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,8,power_law_1.2,0.04226559996604919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,8,power_law_1.2,0.04139519929885864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,8,power_law_1.2,0.041465601325035094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,8,power_law_1.2,0.041875201463699344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,8,power_law_1.2,0.041875201463699344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,8,power_law_1.2,0.042284798622131345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,8,power_law_1.2,0.045561599731445315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,8,power_law_1.2,0.04310399889945984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,8,power_law_1.2,0.04496000111103058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,8,power_law_1.2,0.046374401450157164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,8,power_law_1.2,0.05121920108795166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,8,power_law_1.2,0.05866879820823669
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,8,power_law_1.2,0.05907840132713318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,8,power_law_1.2,0.06439679861068726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,8,power_law_1.2,0.07894399762153625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,8,power_law_1.2,0.08200960159301758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,8,power_law_1.2,0.08806399703025818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,8,power_law_1.2,0.11007360219955445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,8,power_law_1.2,0.12747520208358765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,8,power_law_1.2,0.1630911946296692
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,8,power_law_1.2,0.1966976046562195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,8,power_law_1.2,0.27411839962005613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,8,power_law_1.2,0.35185918807983396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,8,power_law_1.2,0.5009856224060059
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,8,power_law_1.2,0.6263679981231689
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,8,power_law_1.2,0.9419648170471191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,8,power_law_1.2,1.3218688011169433
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,8,power_law_1.2,1.6673664093017577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,8,power_law_1.2,2.6348480224609374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,8,power_law_1.2,5.123168182373047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,2,power_law_1.2,0.03720960021018982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,2,power_law_1.2,0.03880960047245026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,2,power_law_1.2,0.038022398948669434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,1,power_law_1.01,0.03473280072212219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,2,power_law_1.2,0.038841599225997926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,1,power_law_1.01,0.03783040046691895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,2,power_law_1.2,0.040479999780654904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,1,power_law_1.01,0.03863039910793305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,2,power_law_1.2,0.04069760143756866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,1,power_law_1.01,0.03925760090351105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,2,power_law_1.2,0.04089600145816803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,1,power_law_1.01,0.040479999780654904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,2,power_law_1.2,0.04293760061264038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,1,power_law_1.01,0.040057599544525146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,2,power_law_1.2,0.04336000084877014
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,1,power_law_1.01,0.040275201201438904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,2,power_law_1.2,0.049081599712371825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,1,power_law_1.01,0.04128639996051788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,2,power_law_1.2,0.053395199775695804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,1,power_law_1.01,0.041503998637199405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,2,power_law_1.2,0.0576960027217865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,1,power_law_1.01,0.042931199073791504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,2,power_law_1.2,0.07428479790687562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,1,power_law_1.01,0.04579200148582459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,2,power_law_1.2,0.07652480006217957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,1,power_law_1.01,0.0470335990190506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,4,power_law_1.01,0.04863359928131104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,2,power_law_1.2,0.10213119983673095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,4,power_law_1.01,0.044736000895500186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,1,power_law_1.01,0.053376001119613645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,2,power_law_1.2,0.11707520484924316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,4,power_law_1.01,0.04126079976558685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,1,power_law_1.01,0.055219197273254396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,2,power_law_1.2,0.14697599411010742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,4,power_law_1.01,0.04106239974498749
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,1,power_law_1.01,0.06095359921455383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,2,power_law_1.2,0.19428479671478271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,4,power_law_1.01,0.04126079976558685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,1,power_law_1.01,0.07386239767074584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,2,power_law_1.2,0.25962879657745364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,4,power_law_1.01,0.04351359903812409
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,1,power_law_1.01,0.0818560004234314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,2,power_law_1.2,0.34727039337158205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,4,power_law_1.01,0.04412800073623657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,1,power_law_1.01,0.10334080457687378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,2,power_law_1.2,0.5043647766113282
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,4,power_law_1.01,0.045561599731445315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,1,power_law_1.01,0.12198400497436523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,2,power_law_1.2,0.661030387878418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,4,power_law_1.01,0.047603198885917665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,1,power_law_1.01,0.15884799957275392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,2,power_law_1.2,0.6667520046234131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,4,power_law_1.01,0.04863359928131104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,1,power_law_1.01,0.18362879753112793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,2,power_law_1.2,1.2190912246704102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,4,power_law_1.01,0.04842880070209503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,1,power_law_1.01,0.2559295892715454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,2,power_law_1.2,2.4124799728393556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,4,power_law_1.01,0.052934402227401735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,1,power_law_1.01,0.3235071897506714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,4,power_law_1.01,0.05170559883117676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,1,power_law_1.01,0.4625664234161377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,4,power_law_1.01,0.061939197778701785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,1,power_law_1.01,0.594048023223877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,4,power_law_1.01,0.0713536024093628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,1,power_law_1.01,0.7277823925018311
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,4,power_law_1.01,0.07300480008125305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,1,power_law_1.01,1.1748543739318849
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,4,power_law_1.01,0.0815999984741211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,4,power_law_1.01,0.09612159729003907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,1,power_law_1.01,2.239833641052246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,4,power_law_1.01,0.11088639497756958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,4,power_law_1.01,0.12788480520248413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,4,power_law_1.01,0.15383679866790773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,4,power_law_1.01,0.20694398880004883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,4,power_law_1.01,0.2659199953079224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,4,power_law_1.01,0.44819841384887693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,4,power_law_1.01,0.5088128089904785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,4,power_law_1.01,0.9149439811706543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,4,power_law_1.01,0.9677760124206543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,4,power_law_1.2,0.05072640180587769
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,4,power_law_1.01,1.2634943962097167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,4,power_law_1.2,0.04971520006656647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,4,power_law_1.2,0.0412992000579834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,4,power_law_1.01,2.016537666320801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,4,power_law_1.2,0.0412992000579834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,4,power_law_1.01,4.3076416015625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,4,power_law_1.2,0.042124798893928526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,4,power_law_1.2,0.04232960045337677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,4,power_law_1.2,0.04293760061264038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,4,power_law_1.2,0.04581120014190674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,2,power_law_1.01,0.03824000060558319
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,4,power_law_1.2,0.04847359955310822
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,2,power_law_1.01,0.036985599994659425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,4,power_law_1.2,0.05400959849357605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,2,power_law_1.01,0.03761279881000519
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,4,power_law_1.2,0.04744960069656372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,2,power_law_1.01,0.041305598616600034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,4,power_law_1.2,0.05052800178527832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,2,power_law_1.01,0.040889599919319154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,4,power_law_1.2,0.052774399518966675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,2,power_law_1.01,0.04314239919185638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,2,power_law_1.01,0.04417920112609863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,4,power_law_1.2,0.06096640229225159
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,2,power_law_1.01,0.045798400044441225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,4,power_law_1.2,0.0695743978023529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,2,power_law_1.01,0.04785920083522797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,4,power_law_1.2,0.07386879920959473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,2,power_law_1.01,0.047443199157714847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,4,power_law_1.2,0.08082559704780579
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,2,power_law_1.01,0.049081599712371825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,4,power_law_1.2,0.09085440039634704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,2,power_law_1.01,0.04826239943504333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,4,power_law_1.2,0.11623040437698365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,2,power_law_1.2,0.038380798697471616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,2,power_law_1.01,0.05400320291519165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,4,power_law_1.2,0.150655996799469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,2,power_law_1.2,0.03900800049304962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,2,power_law_1.01,0.05768960118293762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,4,power_law_1.2,0.18528000116348267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,2,power_law_1.2,0.03900800049304962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,2,power_law_1.01,0.06505600214004517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,4,power_law_1.2,0.23340160846710206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,2,power_law_1.2,0.041875201463699344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,2,power_law_1.01,0.07077760100364686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,4,power_law_1.2,0.26494081020355226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,2,power_law_1.2,0.042694398760795595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,2,power_law_1.01,0.07405440211296081
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,4,power_law_1.2,0.4564032077789307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,2,power_law_1.2,0.04391680061817169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,2,power_law_1.01,0.09249280095100403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,4,power_law_1.2,0.6030655860900879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,2,power_law_1.2,0.045151999592781066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,2,power_law_1.01,0.10191359519958496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,4,power_law_1.2,0.7183551788330078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,2,power_law_1.2,0.045151999592781066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,2,power_law_1.01,0.1199295997619629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,2,power_law_1.2,0.0463808000087738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,4,power_law_1.2,1.0439935684204102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,2,power_law_1.01,0.14042240381240845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,2,power_law_1.2,0.04924159944057464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,4,power_law_1.2,1.504793643951416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,2,power_law_1.01,0.19162880182266234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,2,power_law_1.2,0.04986239969730377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,4,power_law_1.2,2.3645503997802733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,2,power_law_1.01,0.250598406791687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,2,power_law_1.2,0.05107839703559876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,4,power_law_1.2,4.395334243774414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,2,power_law_1.01,0.33333120346069334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,2,power_law_1.2,0.05211520195007324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,2,power_law_1.2,0.05845119953155518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,2,power_law_1.01,0.4158656120300293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,2,power_law_1.2,0.06603519916534424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,2,power_law_1.01,0.6606016159057617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,2,power_law_1.2,0.0701312005519867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,2,power_law_1.01,0.846771240234375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,2,power_law_1.2,0.07749760150909424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,2,power_law_1.01,1.1552000045776367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,2,power_law_1.2,0.0946943998336792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,2,power_law_1.01,1.5920319557189941
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,2,power_law_1.2,0.1016767978668213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,2,power_law_1.2,0.12911360263824462
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,2,power_law_1.01,3.5597503662109373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,2,power_law_1.2,0.1614016056060791
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,2,power_law_1.2,0.2078847885131836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,2,power_law_1.2,0.23535358905792236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,2,power_law_1.2,0.34004480838775636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,2,power_law_1.2,0.4608895778656006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,2,power_law_1.2,0.7187007904052735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,2,power_law_1.2,0.9124735832214356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,2,power_law_1.2,1.1740032196044923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,2,power_law_1.2,1.8291391372680663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,2,power_law_1.2,3.284044647216797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,1,power_law_1.01,0.03516800105571747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,1,power_law_1.01,0.03597440123558045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,1,power_law_1.01,0.038022398948669434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,1,power_law_1.01,0.042124798893928526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,1,power_law_1.01,0.043372800946235655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,1,power_law_1.01,0.04418559968471527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,1,power_law_1.01,0.04663679897785187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,1,power_law_1.01,0.04560000002384186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,1,power_law_1.01,0.04622080028057098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,1,power_law_1.2,0.03473919928073883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,1,power_law_1.01,0.047443199157714847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,1,power_law_1.2,0.03575679957866669
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,1,power_law_1.01,0.04807040095329285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,1,power_law_1.2,0.037196800112724304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,1,power_law_1.01,0.052774399518966675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,1,power_law_1.2,0.04254080057144165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,1,power_law_1.01,0.05317760109901428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,1,power_law_1.2,0.043961599469184875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,1,power_law_1.01,0.05809919834136963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,1,power_law_1.2,0.04437119960784912
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,1,power_law_1.01,0.06567040085792542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,32,power_law_1.01,0.11601279973983765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,1,power_law_1.2,0.04415999948978424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,1,power_law_1.01,0.07100160121917724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,1,power_law_1.2,0.047040000557899475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,32,power_law_1.01,0.10782079696655274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,1,power_law_1.01,0.07796480059623719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,1,power_law_1.2,0.04867199957370758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,32,power_law_1.01,0.09635199904441834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,1,power_law_1.01,0.08944000005722046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,1,power_law_1.2,0.04969600141048432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,32,power_law_1.01,0.08078719973564148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,1,power_law_1.01,0.10970239639282227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,1,power_law_1.2,0.04824959933757782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,1,power_law_1.01,0.13346560001373292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,1,power_law_1.2,0.05113599896430969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,1,power_law_1.01,0.14903039932250978
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,1,power_law_1.2,0.05256320238113403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,1,power_law_1.01,0.1998080015182495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,1,power_law_1.2,0.0593280017375946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,1,power_law_1.01,0.24528000354766846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,1,power_law_1.2,0.06750720143318176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,1,power_law_1.01,0.34645121097564696
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,1,power_law_1.01,0.4388160228729248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,1,power_law_1.01,0.6389120101928711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,1,power_law_1.01,0.8240256309509277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,1,power_law_1.01,1.0255743980407714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,1,power_law_1.01,1.6055679321289062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,1,power_law_1.01,3.1382976531982423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,32,power_law_1.2,0.11011840105056762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,32,power_law_1.2,0.1047935962677002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,32,power_law_1.2,0.06746240258216858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,32,power_law_1.2,0.07284479737281799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,2,power_law_1.01,0.0445248007774353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,32,power_law_1.2,0.08203520178794861
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,2,power_law_1.01,0.05066239833831787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,32,power_law_1.2,0.08062080144882203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,2,power_law_1.01,0.055366402864456175
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,2,power_law_1.01,0.06193280220031738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,32,power_law_1.2,0.0949567973613739
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,2,power_law_1.01,0.06644480228424073
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,32,power_law_1.2,0.10110080242156982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,2,power_law_1.01,0.07708799839019775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,32,power_law_1.2,0.1074560046195984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,2,power_law_1.01,0.09592959880828858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,32,power_law_1.2,0.10315519571304321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,2,power_law_1.01,0.11558400392532349
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,2,power_law_1.01,0.1475391983985901
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,32,power_law_1.2,0.10764800310134888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,2,power_law_1.01,0.17045120000839234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,32,power_law_1.2,0.10951679944992065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,2,power_law_1.01,0.2528000116348267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,32,power_law_1.2,0.11052800416946411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,2,power_law_1.01,0.3232640027999878
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,32,power_law_1.2,0.12240639925003052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,2,power_law_1.01,0.4932415962219238
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,32,power_law_1.2,0.12177920341491699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,2,power_law_1.01,0.5952320098876953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,2,power_law_1.01,0.7039743900299072
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,32,power_law_1.2,0.12978559732437134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,2,power_law_1.01,1.1096832275390625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,32,power_law_1.2,0.14001920223236083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,2,power_law_1.01,2.3780031204223633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,32,power_law_1.2,0.15763200521469117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,32,power_law_1.2,0.1715648055076599
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,32,power_law_1.2,0.21763839721679687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,32,power_law_1.2,0.2270656108856201
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,32,power_law_1.2,0.30222721099853517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,32,power_law_1.2,0.3591487884521484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,32,power_law_1.2,0.5264768123626709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,32,power_law_1.2,0.6589632034301758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,32,power_law_1.2,0.9854335784912109
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,32,power_law_1.2,1.2232000350952148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,32,power_law_1.2,1.5047103881835937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,16,power_law_1.01,0.0967423975467682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,32,power_law_1.2,2.3489919662475587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,16,power_law_1.01,0.11354880332946778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,32,power_law_1.2,6.033343887329101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,16,power_law_1.01,0.07299839854240417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,16,power_law_1.01,0.07196800112724304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,16,power_law_1.01,0.07912960052490234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,16,power_law_1.01,0.08568320274353028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,16,power_law_1.01,0.09920639991760254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,16,power_law_1.01,0.1024832010269165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,16,power_law_1.01,0.10535680055618286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,16,power_law_1.01,0.10780800580978393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,16,power_law_1.01,0.10760320425033569
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,16,power_law_1.01,0.11025919914245605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,16,power_law_1.01,0.11558400392532349
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,16,power_law_1.01,0.11558400392532349
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,16,power_law_1.2,0.09208319783210754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,16,power_law_1.01,0.12583680152893068
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,16,power_law_1.2,0.10766079425811767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,16,power_law_1.01,0.12910079956054688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,16,power_law_1.2,0.06383360028266907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,16,power_law_1.01,0.13689600229263305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,16,power_law_1.2,0.06607999801635742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,16,power_law_1.01,0.15325440168380738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,16,power_law_1.2,0.0769216001033783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,16,power_law_1.01,0.16332800388336183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,16,power_law_1.2,0.09086080193519593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,16,power_law_1.01,0.19556479454040526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,16,power_law_1.2,0.09475839734077454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,16,power_law_1.01,0.2201535940170288
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,16,power_law_1.2,0.10008959770202637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,16,power_law_1.01,0.2831104040145874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,16,power_law_1.2,0.10376960039138794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,16,power_law_1.01,0.33882238864898684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,16,power_law_1.2,0.10540159940719604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,16,power_law_1.01,0.43137922286987307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,16,power_law_1.2,0.10807039737701415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,16,power_law_1.01,0.5718848228454589
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,16,power_law_1.2,0.1082751989364624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,16,power_law_1.01,0.7670591831207275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,16,power_law_1.2,0.11257599592208863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,16,power_law_1.01,1.0271679878234863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,16,power_law_1.2,0.12281600236892701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,16,power_law_1.01,1.2337984085083007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,16,power_law_1.2,0.13408000469207765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,16,power_law_1.2,0.13509759902954102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,16,power_law_1.01,1.854547119140625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,16,power_law_1.2,0.14247039556503296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,16,power_law_1.01,3.7896705627441407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,16,power_law_1.2,0.16131839752197266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,16,power_law_1.2,0.17073919773101806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,16,power_law_1.2,0.20636799335479736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,16,power_law_1.2,0.23702399730682372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,16,power_law_1.2,0.30755200386047366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,16,power_law_1.2,0.3618175983428955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,16,power_law_1.2,0.4948671817779541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,16,power_law_1.2,0.6014336109161377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,16,power_law_1.2,0.8301888465881347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,16,power_law_1.2,1.1457216262817382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,16,power_law_1.2,1.5048064231872558
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,16,power_law_1.2,2.0964736938476562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,8,power_law_1.01,0.07482879757881164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,8,power_law_1.01,0.09102079868316651
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,16,power_law_1.2,4.748627090454102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,8,power_law_1.01,0.06316159963607788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,8,power_law_1.01,0.0670144021511078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,8,power_law_1.01,0.08118399977684021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,8,power_law_1.01,0.08897280097007751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,8,power_law_1.01,0.1049407958984375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,8,power_law_1.01,0.10473599433898925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,8,power_law_1.01,0.11026560068130493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,8,power_law_1.01,0.10986239910125732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,8,power_law_1.01,0.11968640089035035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,8,power_law_1.01,0.11599999666213989
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,8,power_law_1.01,0.12009600400924683
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,8,power_law_1.01,0.12314879894256592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,8,power_law_1.2,0.07365120053291321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,8,power_law_1.01,0.129312002658844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,8,power_law_1.2,0.1047935962677002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,8,power_law_1.01,0.13443200588226317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,8,power_law_1.2,0.058713597059249875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,8,power_law_1.01,0.14467840194702147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,8,power_law_1.2,0.06504319906234741
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,32,power_law_1.01,0.08629760146141052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,8,power_law_1.01,0.16187520027160646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,8,power_law_1.2,0.07694079875946044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,32,power_law_1.01,0.0902079999446869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,8,power_law_1.01,0.17539199590682983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,8,power_law_1.2,0.08288000226020813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,32,power_law_1.01,0.10249600410461426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,8,power_law_1.01,0.2065216064453125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,8,power_law_1.2,0.10007679462432861
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,32,power_law_1.01,0.09921280145645142
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,1,power_law_1.2,0.06968320012092591
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,8,power_law_1.01,0.24133760929107667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,8,power_law_1.2,0.10376960039138794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,32,power_law_1.01,0.10249600410461426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,1,power_law_1.2,0.07693439722061157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,8,power_law_1.01,0.30195839405059816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,8,power_law_1.2,0.1074560046195984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,32,power_law_1.01,0.10556800365447998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,1,power_law_1.2,0.08963199853897094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,1,power_law_1.2,0.10825599431991577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,8,power_law_1.2,0.10703999996185302
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,8,power_law_1.01,0.35742080211639404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,32,power_law_1.01,0.10781439542770385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,1,power_law_1.2,0.12670079469680787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,8,power_law_1.2,0.1150272011756897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,32,power_law_1.01,0.1065600037574768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,8,power_law_1.01,0.49117441177368165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,1,power_law_1.2,0.14697599411010742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,8,power_law_1.2,0.11503360271453858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,32,power_law_1.01,0.11601279973983765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,8,power_law_1.01,0.6230463981628418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,1,power_law_1.2,0.20064001083374022
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,8,power_law_1.2,0.11667200326919555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,1,power_law_1.2,0.2420032024383545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,32,power_law_1.01,0.12092800140380859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,8,power_law_1.01,0.8575679779052734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,1,power_law_1.2,0.3411263942718506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,8,power_law_1.2,0.12076159715652465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,32,power_law_1.01,0.1268671989440918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,8,power_law_1.01,1.101088047027588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,1,power_law_1.2,0.4335040092468262
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,8,power_law_1.2,0.13181439638137818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,32,power_law_1.01,0.1344256043434143
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,1,power_law_1.2,0.6272255897521972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,8,power_law_1.01,1.319814395904541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,8,power_law_1.2,0.136953604221344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,32,power_law_1.01,0.13485440015792846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,1,power_law_1.2,0.8088831901550293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,8,power_law_1.2,0.14821120500564575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,8,power_law_1.01,2.057900810241699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,32,power_law_1.01,0.15471359491348266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,1,power_law_1.2,1.0108287811279297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,8,power_law_1.2,0.167468798160553
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,1,power_law_1.2,1.5809727668762208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,32,power_law_1.01,0.16393599510192872
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,8,power_law_1.01,3.911763381958008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,8,power_law_1.2,0.17933440208435059
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,32,power_law_1.01,0.1954624056816101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,1,power_law_1.2,3.1184064865112306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,32,power_law_1.01,0.2220736026763916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,8,power_law_1.2,0.21497600078582763
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,32,power_law_1.01,0.2816960096359253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,8,power_law_1.2,0.24405760765075685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,32,power_law_1.01,0.3273535966873169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,8,power_law_1.2,0.3132800102233887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,32,power_law_1.01,0.475648021697998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,8,power_law_1.2,0.37800960540771483
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,8,power_law_1.2,0.5346496105194092
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,32,power_law_1.01,0.5624639987945557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,8,power_law_1.2,0.6380799770355224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,32,power_law_1.01,0.8182527542114257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,8,power_law_1.2,0.8883456230163574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,32,power_law_1.01,1.0299903869628906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,32,power_law_1.01,1.2104448318481444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,8,power_law_1.2,1.1724032402038573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,8,power_law_1.2,1.4161151885986327
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,32,power_law_1.01,1.9779327392578125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,8,power_law_1.2,2.2631744384765624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,32,power_law_1.01,3.9641857147216797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,8,power_law_1.2,4.847552108764648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,4,power_law_1.01,0.07400959730148315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,4,power_law_1.2,0.0728384017944336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,4,power_law_1.01,0.07627519965171814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,4,power_law_1.2,0.07488639950752259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,4,power_law_1.01,0.06724479794502258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,4,power_law_1.2,0.06424319744110107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,4,power_law_1.01,0.06705920100212097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,4,power_law_1.2,0.07570559978485107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,4,power_law_1.01,0.08815360069274902
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,4,power_law_1.2,0.07959039807319641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,4,power_law_1.01,0.09552000164985656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,4,power_law_1.2,0.09619839787483216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,4,power_law_1.01,0.115174400806427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,4,power_law_1.2,0.11708159446716308
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,4,power_law_1.01,0.12337919473648071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,4,power_law_1.2,0.11624319553375244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,4,power_law_1.01,0.12172800302505493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,4,power_law_1.2,0.1221824049949646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,4,power_law_1.2,0.12730239629745482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,4,power_law_1.01,0.13157119750976562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,4,power_law_1.2,0.13836159706115722
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,4,power_law_1.01,0.13808640241622924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,4,power_law_1.2,0.1498304009437561
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,4,power_law_1.01,0.14016640186309814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,4,power_law_1.2,0.14655359983444213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,4,power_law_1.01,0.14734079837799072
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,4,power_law_1.2,0.14451199769973755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,4,power_law_1.01,0.1545024037361145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,4,power_law_1.2,0.1565888047218323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,4,power_law_1.01,0.15695359706878662
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,4,power_law_1.2,0.16376960277557373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,4,power_law_1.01,0.17006080150604247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,4,power_law_1.01,0.1856384038925171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,4,power_law_1.2,0.17727999687194823
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,2,power_law_1.01,0.06358399987220764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,4,power_law_1.2,0.19775359630584716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,2,power_law_1.01,0.07300480008125305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,2,power_law_1.2,0.0630079984664917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,4,power_law_1.2,0.2170111894607544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,2,power_law_1.01,0.06970880031585694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,2,power_law_1.2,0.06954879760742187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,4,power_law_1.2,0.26042881011962893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,2,power_law_1.01,0.08158720135688782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,2,power_law_1.2,0.06424959897994995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,4,power_law_1.2,0.3013887882232666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,2,power_law_1.01,0.0996288001537323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,2,power_law_1.2,0.07774720191955567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,4,power_law_1.2,0.3820863962173462
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,2,power_law_1.01,0.11641600131988525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,2,power_law_1.2,0.09393919706344604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,4,power_law_1.2,0.4711616039276123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,2,power_law_1.01,0.1438591957092285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,2,power_law_1.2,0.11380480527877808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,4,power_law_1.2,0.594048023223877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,2,power_law_1.01,0.1561535954475403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,2,power_law_1.2,0.14780160188674926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,4,power_law_1.2,0.7855360031127929
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,2,power_law_1.01,0.16475520133972169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,2,power_law_1.2,0.14636160135269166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,4,power_law_1.2,1.0675519943237304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,2,power_law_1.01,0.16802560091018676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,2,power_law_1.2,0.15310720205307007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,4,power_law_1.2,1.3333696365356444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,2,power_law_1.01,0.16700799465179444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,2,power_law_1.2,0.15415040254592896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,4,power_law_1.2,1.7042688369750976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,2,power_law_1.01,0.17294080257415773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,2,power_law_1.2,0.18098560571670533
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,2,power_law_1.01,0.1790719985961914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,2,power_law_1.2,0.18199679851531983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,4,power_law_1.2,2.4538368225097655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,2,power_law_1.01,0.21205759048461914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,2,power_law_1.2,0.1934656023979187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,4,power_law_1.2,5.213312149047852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,2,power_law_1.01,0.23070080280303956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,2,power_law_1.2,0.20964479446411133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,2,power_law_1.2,0.21886720657348632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,2,power_law_1.01,0.24380800724029542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,2,power_law_1.2,0.23749759197235107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,2,power_law_1.01,0.21637120246887206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,2,power_law_1.01,0.2413503885269165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,2,power_law_1.2,0.24773759841918946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,2,power_law_1.01,0.2788288116455078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,2,power_law_1.2,0.27859840393066404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,2,power_law_1.01,0.3300287961959839
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,2,power_law_1.2,0.2833791971206665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,2,power_law_1.01,0.39003520011901854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,2,power_law_1.2,0.34009599685668945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,2,power_law_1.01,0.4998079776763916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,2,power_law_1.2,0.398470401763916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,2,power_law_1.01,0.594816017150879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,2,power_law_1.2,0.5088640213012695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,2,power_law_1.01,0.7936960220336914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,2,power_law_1.2,0.6470335960388184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,2,power_law_1.01,0.9984831809997559
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,2,power_law_1.2,0.8158207893371582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,2,power_law_1.2,0.9833727836608886
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,2,power_law_1.01,1.351353645324707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,2,power_law_1.2,1.430463981628418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,2,power_law_1.01,1.7087295532226563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,2,power_law_1.2,1.827564811706543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,2,power_law_1.01,2.173017692565918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,2,power_law_1.2,2.1665151596069334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,2,power_law_1.01,3.186137580871582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,2,power_law_1.2,3.5065280914306642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,2,power_law_1.01,5.99881591796875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,2,power_law_1.2,7.073452758789062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,32,power_law_1.01,0.05400320291519165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,32,power_law_1.01,0.047865599393844604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,32,power_law_1.01,0.03639039993286133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,32,power_law_1.01,0.03925119936466217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,32,power_law_1.01,0.040479999780654904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,32,power_law_1.01,0.041715198755264284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,32,power_law_1.01,0.041305598616600034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,32,power_law_1.01,0.0412992000579834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,32,power_law_1.01,0.04252800047397613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,1,power_law_1.01,0.06382079720497132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,32,power_law_1.01,0.04357120096683502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,1,power_law_1.01,0.07160320281982421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,32,power_law_1.01,0.04787200093269348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,1,power_law_1.01,0.07774720191955567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,32,power_law_1.01,0.04910080134868622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,1,power_law_1.01,0.1051967978477478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,32,power_law_1.01,0.052985602617263795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,32,power_law_1.01,0.05072640180587769
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,1,power_law_1.01,0.13672959804534912
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,32,power_law_1.01,0.055846399068832396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,1,power_law_1.01,0.15637120008468627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,32,power_law_1.01,0.0593280017375946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,1,power_law_1.01,0.2038975954055786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,32,power_law_1.01,0.06157439947128296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,1,power_law_1.01,0.21559040546417235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,32,power_law_1.01,0.07120640277862549
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,1,power_law_1.01,0.21824638843536376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,32,power_law_1.01,0.08472319841384887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,1,power_law_1.01,0.2301248073577881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,32,power_law_1.01,0.10009599924087524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,32,power_law_1.01,0.11093759536743164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,1,power_law_1.01,0.23790719509124755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,32,power_law_1.01,0.1432960033416748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,1,power_law_1.01,0.24814720153808595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,32,power_law_1.01,0.1854848027229309
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,1,power_law_1.01,0.2516160011291504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,32,power_law_1.01,0.2315648078918457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,1,power_law_1.01,0.31305599212646484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,32,power_law_1.01,0.2886912107467651
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,1,power_law_1.01,0.35176959037780764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,32,power_law_1.01,0.41854081153869627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,1,power_law_1.01,0.3439807891845703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,32,power_law_1.01,0.5469567775726318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,1,power_law_1.01,0.3097791910171509
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,1,power_law_1.2,0.06746240258216858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,32,power_law_1.01,0.6823232173919678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,1,power_law_1.01,0.36366078853607176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,1,power_law_1.2,0.07382400035858154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,32,power_law_1.01,1.2797183990478516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,1,power_law_1.01,0.4486400127410889
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,1,power_law_1.2,0.08324480056762695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,1,power_law_1.01,0.5321856021881104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,1,power_law_1.2,0.09695360064506531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,32,power_law_1.01,2.1661056518554687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,1,power_law_1.01,0.6067455768585205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,1,power_law_1.2,0.12010879516601562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,1,power_law_1.2,0.16269439458847046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,1,power_law_1.01,0.7613056182861329
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,1,power_law_1.2,0.21923201084136962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,1,power_law_1.01,0.9726655960083008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,1,power_law_1.2,0.23479039669036866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,1,power_law_1.01,1.2680447578430176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,1,power_law_1.2,0.24339840412139893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,1,power_law_1.01,1.539616012573242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,1,power_law_1.2,0.2446079969406128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,1,power_law_1.01,2.1069183349609375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,1,power_law_1.2,0.25445120334625243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,32,power_law_1.2,0.0546176016330719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,1,power_law_1.01,2.668467140197754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,1,power_law_1.2,0.26406400203704833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,32,power_law_1.2,0.040889599919319154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,1,power_law_1.01,3.249689483642578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,1,power_law_1.2,0.2800512075424194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,32,power_law_1.2,0.03782399892807007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,32,power_law_1.2,0.03761920034885406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,1,power_law_1.2,0.33023359775543215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,1,power_law_1.01,4.979814529418945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,32,power_law_1.2,0.04007039964199066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,1,power_law_1.2,0.3451839923858643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,32,power_law_1.2,0.04211840033531189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,1,power_law_1.2,0.36318719387054443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,1,power_law_1.01,9.595417785644532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,32,power_law_1.2,0.0412992000579834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,1,power_law_1.2,0.31875200271606446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,32,power_law_1.2,0.04335359930992126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,1,power_law_1.2,0.3793728113174438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,32,power_law_1.2,0.043136000633239746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,1,power_law_1.2,0.41930880546569826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,32,power_law_1.2,0.04457600116729736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,32,power_law_1.2,0.04807040095329285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,1,power_law_1.2,0.5079808235168457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,32,power_law_1.2,0.05235199928283692
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,1,power_law_1.2,0.6168896198272705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,32,power_law_1.2,0.05605120062828064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,1,power_law_1.2,0.7670656204223633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,32,power_law_1.2,0.052160000801086424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,1,power_law_1.2,0.9964415550231933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,16,power_law_1.01,0.055820798873901366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,32,power_law_1.2,0.06218240261077881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,1,power_law_1.2,1.2854144096374511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,16,power_law_1.01,0.03740800023078918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,32,power_law_1.2,0.067084801197052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,16,power_law_1.01,0.03638400137424469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,32,power_law_1.2,0.06458879709243774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,1,power_law_1.2,1.5461183547973634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,16,power_law_1.01,0.038841599225997926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,32,power_law_1.2,0.07979519963264466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,1,power_law_1.2,2.118937683105469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,16,power_law_1.01,0.03800959885120392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,32,power_law_1.2,0.09045760035514831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,1,power_law_1.2,2.6893056869506835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,16,power_law_1.01,0.04314239919185638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,32,power_law_1.2,0.10785919427871704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,16,power_law_1.01,0.04417920112609863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,32,power_law_1.2,0.13162239789962768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,1,power_law_1.2,3.264390563964844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,16,power_law_1.01,0.043750399351119997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,32,power_law_1.2,0.17111040353775026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,1,power_law_1.2,4.979398345947265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,16,power_law_1.01,0.04353919923305512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,32,power_law_1.2,0.20638079643249513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,16,power_law_1.01,0.044563201069831845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,32,power_law_1.2,0.27026560306549074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,1,power_law_1.2,9.567513275146485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,16,power_law_1.01,0.048876801133155824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,32,power_law_1.2,0.3460479974746704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,16,power_law_1.01,0.049702399969100954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,32,power_law_1.2,0.5649600028991699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,16,power_law_1.01,0.05256320238113403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,32,power_law_1.2,0.783903980255127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,16,power_law_1.01,0.050297600030899045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,32,power_law_1.2,0.955942440032959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,16,power_law_1.01,0.058297598361968996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,32,power_law_1.2,2.097279930114746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,16,power_law_1.01,0.060140800476074216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,16,power_law_1.01,0.06318719983100891
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,32,power_law_1.2,4.2929534912109375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,16,power_law_1.01,0.07427840232849121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,4,power_law_1.01,0.20857601165771483
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,16,power_law_1.01,0.08184319734573364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,16,power_law_1.2,0.050457602739334105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,4,power_law_1.01,0.21676158905029297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,16,power_law_1.01,0.1004863977432251
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,16,power_law_1.2,0.03715839982032776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,4,power_law_1.01,0.24951040744781494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,16,power_law_1.01,0.11256320476531982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,16,power_law_1.2,0.0359360009431839
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,16,power_law_1.01,0.14881279468536376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,4,power_law_1.01,0.2949887990951538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,16,power_law_1.2,0.039001598954200745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,16,power_law_1.01,0.17728639841079713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,16,power_law_1.2,0.0406464010477066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,4,power_law_1.01,0.36421120166778564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,16,power_law_1.01,0.2454848051071167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,16,power_law_1.2,0.04575360119342804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,4,power_law_1.01,0.4215551853179932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,16,power_law_1.2,0.04474239945411682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,16,power_law_1.01,0.288703989982605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,4,power_law_1.01,0.5661439895629883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,16,power_law_1.2,0.04474239945411682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,16,power_law_1.01,0.42816638946533203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,8,power_law_1.01,0.04577920138835907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,4,power_law_1.01,0.7478079795837402
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,16,power_law_1.2,0.044736000895500186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,8,power_law_1.01,0.035980799794197084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,16,power_law_1.01,0.5129536151885986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,4,power_law_1.01,0.9964096069335937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,16,power_law_1.2,0.04474239945411682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,8,power_law_1.01,0.0355648010969162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,16,power_law_1.01,0.6806719779968262
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,16,power_law_1.2,0.04679040014743805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,4,power_law_1.01,1.30383358001709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,8,power_law_1.01,0.039468801021575926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,16,power_law_1.01,1.0235199928283691
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,16,power_law_1.2,0.049446401000022885
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,8,power_law_1.01,0.040275201201438904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,4,power_law_1.01,1.6337600708007813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,16,power_law_1.2,0.050470399856567386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,8,power_law_1.01,0.042752000689506534
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,16,power_law_1.01,2.1648576736450194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,4,power_law_1.01,2.401759910583496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,16,power_law_1.2,0.051692801713943484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,8,power_law_1.01,0.043968001008033754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,8,power_law_1.01,0.04498560130596161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,16,power_law_1.2,0.05907840132713318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,4,power_law_1.01,4.962995147705078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,8,power_law_1.01,0.047654399275779726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,16,power_law_1.2,0.0590719997882843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,8,power_law_1.01,0.04683519899845123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,16,power_law_1.2,0.0701312005519867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,8,power_law_1.01,0.04888319969177246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,16,power_law_1.2,0.07688959836959838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,8,power_law_1.01,0.050323200225830075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,16,power_law_1.2,0.08734080195426941
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,8,power_law_1.01,0.05480960011482239
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,16,power_law_1.2,0.10740480422973633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,8,power_law_1.01,0.05314559936523437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,16,power_law_1.2,0.11847039461135864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,8,power_law_1.01,0.0630079984664917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,16,power_law_1.2,0.15492479801177977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,8,power_law_1.2,0.04805760085582733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,8,power_law_1.01,0.06872320175170898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,8,power_law_1.2,0.03699199855327606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,16,power_law_1.2,0.18031359910964967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,8,power_law_1.01,0.06997759938240052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,8,power_law_1.2,0.035148799419403076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,16,power_law_1.2,0.2689919948577881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,8,power_law_1.01,0.08021119832992554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,8,power_law_1.2,0.03800959885120392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,16,power_law_1.2,0.3367743968963623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,8,power_law_1.01,0.08654720187187195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,8,power_law_1.2,0.040678399801254275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,16,power_law_1.2,0.5071616172790527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,4,power_law_1.01,0.043296000361442565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,8,power_law_1.01,0.10970879793167114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,8,power_law_1.2,0.043756800889968875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,16,power_law_1.2,0.6075136184692382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,4,power_law_1.01,0.039417600631713866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,8,power_law_1.01,0.11932159662246704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,8,power_law_1.2,0.044947201013565065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,16,power_law_1.2,0.8153856277465821
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,4,power_law_1.01,0.03857919871807099
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,8,power_law_1.01,0.15803519487380982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,8,power_law_1.2,0.04784640073776245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,4,power_law_1.01,0.04268159866333008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,16,power_law_1.2,1.588710403442383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,8,power_law_1.2,0.04826239943504333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,8,power_law_1.01,0.18814079761505126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,4,power_law_1.01,0.04472320079803467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,8,power_law_1.2,0.050297600030899045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,8,power_law_1.01,0.2407615900039673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,16,power_law_1.2,3.088057518005371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,4,power_law_1.01,0.05333120226860046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,8,power_law_1.2,0.050732797384262084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,8,power_law_1.01,0.30672640800476075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,4,power_law_1.01,0.05495679974555969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,8,power_law_1.2,0.052767997980117796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,8,power_law_1.01,0.435532808303833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,4,power_law_1.01,0.05578879714012146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,8,power_law_1.2,0.05480960011482239
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,8,power_law_1.01,0.5350719928741455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,4,power_law_1.01,0.05825279951095581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,8,power_law_1.2,0.05664640069007874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,8,power_law_1.01,0.6831232070922851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,8,power_law_1.2,0.0642304003238678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,4,power_law_1.01,0.05822719931602478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,8,power_law_1.01,1.099500846862793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,8,power_law_1.2,0.06668800115585327
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,4,power_law_1.01,0.055174398422241214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,8,power_law_1.2,0.07201279997825623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,4,power_law_1.01,0.05578240156173706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,8,power_law_1.01,2.161612892150879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,8,power_law_1.2,0.07896959781646729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,4,power_law_1.01,0.058246397972106935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,8,power_law_1.2,0.08983680009841918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,4,power_law_1.01,0.06072319746017456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,8,power_law_1.2,0.11338880062103271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,4,power_law_1.01,0.06685439944267273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,8,power_law_1.2,0.13408639430999755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,4,power_law_1.01,0.07258880138397217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,4,power_law_1.2,0.041868799924850465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,8,power_law_1.2,0.16049280166625976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,4,power_law_1.01,0.08036479949951172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,4,power_law_1.2,0.0359360009431839
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,8,power_law_1.2,0.19633280038833617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,4,power_law_1.2,0.03941119909286499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,4,power_law_1.01,0.09367039799690247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,8,power_law_1.2,0.2735424041748047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,4,power_law_1.2,0.04249599874019623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,4,power_law_1.01,0.1033087968826294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,4,power_law_1.2,0.04516479969024658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,8,power_law_1.2,0.37798399925231935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,4,power_law_1.01,0.12499840259552002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,4,power_law_1.2,0.051910400390625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,4,power_law_1.01,0.15161600112915039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,8,power_law_1.2,0.54202880859375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,4,power_law_1.2,0.055801600217819214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,4,power_law_1.01,0.19299839735031127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,8,power_law_1.2,0.7077184200286866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,4,power_law_1.2,0.0578495979309082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,4,power_law_1.01,0.2380608081817627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,8,power_law_1.2,1.0202303886413575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,4,power_law_1.2,0.05539199709892273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,4,power_law_1.01,0.31341440677642823
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,8,power_law_1.2,1.3104384422302247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,4,power_law_1.2,0.057657599449157715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,4,power_law_1.01,0.3895999908447266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,4,power_law_1.2,0.05559679865837097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,8,power_law_1.2,2.3428287506103516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,4,power_law_1.01,0.5243775844573975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,2,power_law_1.01,0.042124798893928526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,4,power_law_1.2,0.05744640231132507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,2,power_law_1.01,0.03883520066738129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,4,power_law_1.01,0.695366382598877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,4,power_law_1.2,0.06111999750137329
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,2,power_law_1.01,0.04232319891452789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,4,power_law_1.01,0.8100671768188477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,4,power_law_1.2,0.06562560200691223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,2,power_law_1.01,0.04539520144462585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,4,power_law_1.2,0.07382400035858154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,4,power_law_1.01,1.2923647880554199
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,2,power_law_1.01,0.05379199981689453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,4,power_law_1.2,0.07811200022697448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,2,power_law_1.01,0.06649600267410279
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,4,power_law_1.01,2.6540607452392577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,4,power_law_1.2,0.08200960159301758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,2,power_law_1.01,0.06505600214004517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,4,power_law_1.2,0.09266560077667237
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,2,power_law_1.01,0.06895359754562377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,4,power_law_1.2,0.11108479499816895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,2,power_law_1.01,0.0703935980796814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,4,power_law_1.2,0.12912000417709352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,2,power_law_1.01,0.069760000705719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,4,power_law_1.2,0.16125439405441283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,2,power_law_1.01,0.08021759986877441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,4,power_law_1.2,0.1991487979888916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,2,power_law_1.01,0.0830784022808075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,4,power_law_1.2,0.23438079357147218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,2,power_law_1.01,0.08799999952316284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,4,power_law_1.2,0.3318720102310181
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,2,power_law_1.01,0.08615679740905761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,4,power_law_1.2,0.4666111946105957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,2,power_law_1.01,0.09721599817276001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,4,power_law_1.2,0.645414400100708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,2,power_law_1.2,0.04149760007858276
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,2,power_law_1.01,0.10232319831848144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,2,power_law_1.2,0.038438400626182555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,4,power_law_1.2,0.7953023910522461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,2,power_law_1.01,0.10847359895706177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,2,power_law_1.2,0.04293760061264038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,4,power_law_1.2,1.0728192329406738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,2,power_law_1.01,0.11606400012969971
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,2,power_law_1.2,0.04785279929637909
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,2,power_law_1.01,0.14083199501037597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,4,power_law_1.2,1.7435392379760741
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,2,power_law_1.2,0.049702399969100954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,2,power_law_1.01,0.17320319414138793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,2,power_law_1.2,0.06239359974861145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,4,power_law_1.2,3.1988479614257814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,2,power_law_1.01,0.21087999343872071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,2,power_law_1.2,0.06934400200843811
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,2,power_law_1.01,0.258790397644043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,2,power_law_1.2,0.06894720196723939
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,2,power_law_1.01,0.3194175958633423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,2,power_law_1.2,0.07117440104484558
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,2,power_law_1.01,0.4412735939025879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,2,power_law_1.2,0.07406719923019409
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,2,power_law_1.01,0.536294412612915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,2,power_law_1.2,0.07386879920959473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,2,power_law_1.01,0.7654655933380127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,2,power_law_1.2,0.07980160117149353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,2,power_law_1.01,0.9784768104553223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,2,power_law_1.2,0.08432000279426574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,2,power_law_1.01,1.214195156097412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,2,power_law_1.2,0.09003520011901855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,1,power_law_1.01,0.04185599982738495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,2,power_law_1.01,1.7865983963012695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,2,power_law_1.2,0.1019327998161316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,1,power_law_1.01,0.043910399079322815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,2,power_law_1.2,0.10069760084152221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,1,power_law_1.01,0.050271999835968015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,2,power_law_1.01,3.4950401306152346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,2,power_law_1.2,0.10887680053710938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,1,power_law_1.01,0.058246397972106935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,2,power_law_1.2,0.1258687973022461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,1,power_law_1.01,0.06643840074539184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,2,power_law_1.2,0.139193594455719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,1,power_law_1.01,0.08773760199546814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,2,power_law_1.2,0.17953920364379883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,1,power_law_1.01,0.09305599927902222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,2,power_law_1.2,0.2051392078399658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,1,power_law_1.01,0.09573760032653808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,2,power_law_1.2,0.278054404258728
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,1,power_law_1.01,0.09900799989700318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,2,power_law_1.2,0.3329279899597168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,1,power_law_1.01,0.10166399478912354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,2,power_law_1.2,0.43636479377746584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,1,power_law_1.01,0.11354880332946778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,1,power_law_1.01,0.12336000204086303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,2,power_law_1.2,0.5559616088867188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,1,power_law_1.01,0.13278720378875733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,2,power_law_1.2,0.8080703735351562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,1,power_law_1.01,0.12499840259552002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,2,power_law_1.2,0.9628864288330078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,32,power_law_1.01,0.10622080564498901
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,1,power_law_1.01,0.13623039722442626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,32,power_law_1.01,0.09086080193519593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,2,power_law_1.2,1.4083264350891114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,1,power_law_1.2,0.04268159866333008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,1,power_law_1.01,0.1446720004081726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,32,power_law_1.01,0.0646399974822998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,1,power_law_1.2,0.04474239945411682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,2,power_law_1.2,2.0419776916503904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,1,power_law_1.01,0.15081599950790406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,32,power_law_1.01,0.07345920205116271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,1,power_law_1.2,0.04965760111808777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,1,power_law_1.01,0.1794816017150879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,32,power_law_1.01,0.07959679961204529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,2,power_law_1.2,4.0930431365966795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,1,power_law_1.2,0.057843202352523805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,1,power_law_1.01,0.20938880443573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,32,power_law_1.01,0.08676480054855347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,1,power_law_1.2,0.061945599317550656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,1,power_law_1.01,0.26467199325561525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,32,power_law_1.01,0.08923519849777221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,1,power_law_1.2,0.09164159893989562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,1,power_law_1.01,0.31383039951324465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,32,power_law_1.01,0.09065600037574768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,1,power_law_1.2,0.09777920246124268
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,32,power_law_1.01,0.08698239922523499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,1,power_law_1.2,0.10003839731216431
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,1,power_law_1.01,0.40558719635009766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,1,power_law_1.2,0.1020799994468689
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,32,power_law_1.01,0.09168000221252441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,1,power_law_1.01,0.49201278686523436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,1,power_law_1.2,0.10494719743728638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,32,power_law_1.01,0.09147520065307617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,1,power_law_1.01,0.6667136192321778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,1,power_law_1.2,0.11356159448623657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,32,power_law_1.01,0.0957759976387024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,1,power_law_1.01,0.8309632301330566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,1,power_law_1.2,0.12583680152893068
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,32,power_law_1.01,0.09845759868621826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,1,power_law_1.01,1.1658047676086425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,1,power_law_1.2,0.13279999494552613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,32,power_law_1.01,0.10294400453567505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,1,power_law_1.01,1.5088319778442383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,1,power_law_1.2,0.13219200372695922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,32,power_law_1.01,0.10909440517425537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,1,power_law_1.01,1.829964828491211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,32,power_law_1.2,0.11298559904098511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,1,power_law_1.2,0.14796160459518432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,32,power_law_1.01,0.11463040113449097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,32,power_law_1.2,0.07325440049171447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,1,power_law_1.2,0.15389440059661866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,32,power_law_1.01,0.11973760128021241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,1,power_law_1.01,2.8312320709228516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,32,power_law_1.2,0.0634112000465393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,1,power_law_1.2,0.14673279523849486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,32,power_law_1.01,0.13941119909286498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,32,power_law_1.2,0.06798080205917359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,1,power_law_1.01,5.5263935089111325
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,1,power_law_1.2,0.17786240577697754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,32,power_law_1.01,0.1543552041053772
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,32,power_law_1.2,0.08141440153121948
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,1,power_law_1.2,0.20611839294433593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,32,power_law_1.01,0.1875264048576355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,32,power_law_1.2,0.09066240191459655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,1,power_law_1.2,0.2558784008026123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,32,power_law_1.01,0.21660799980163575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,32,power_law_1.2,0.08756480216979981
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,1,power_law_1.2,0.32204160690307615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,32,power_law_1.01,0.2782464027404785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,32,power_law_1.2,0.09045760035514831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,1,power_law_1.2,0.4099135875701904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,32,power_law_1.01,0.3321151971817017
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,32,power_law_1.2,0.0896127998828888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,1,power_law_1.2,0.49733757972717285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,32,power_law_1.01,0.42981758117675783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,32,power_law_1.2,0.0933184027671814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,1,power_law_1.2,0.6699776172637939
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,32,power_law_1.01,0.5690688133239746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,32,power_law_1.2,0.09658240079879761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,1,power_law_1.2,0.8346367835998535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,32,power_law_1.01,0.8662400245666504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,32,power_law_1.2,0.09536640048027038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,1,power_law_1.2,1.1690815925598144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,32,power_law_1.01,1.1040063858032227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,32,power_law_1.2,0.09945600032806397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,1,power_law_1.2,1.503104019165039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,32,power_law_1.01,1.3096192359924317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,32,power_law_1.2,0.10683519840240478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,16,power_law_1.01,0.09797120094299316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,1,power_law_1.2,1.8373376846313476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,32,power_law_1.01,2.0096256256103517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,32,power_law_1.2,0.11564160585403442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,16,power_law_1.01,0.0832319974899292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,1,power_law_1.2,2.834931182861328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,32,power_law_1.2,0.12076159715652465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,16,power_law_1.01,0.057017600536346434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,32,power_law_1.01,4.4930366516113285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,32,power_law_1.2,0.12280960083007812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,16,power_law_1.01,0.07217919826507568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,1,power_law_1.2,5.539923095703125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,32,power_law_1.2,0.15005439519882202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,16,power_law_1.01,0.07217280268669128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,32,power_law_1.2,0.16499840021133422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,16,power_law_1.01,0.08609920144081115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,32,power_law_1.2,0.19359359741210938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,16,power_law_1.01,0.08855680227279664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,32,power_law_1.2,0.22677760124206542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,16,power_law_1.01,0.08897280097007751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,32,power_law_1.2,0.31573119163513186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,16,power_law_1.01,0.09040639996528625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,32,power_law_1.2,0.33292160034179685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,16,power_law_1.01,0.09409279823303222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,32,power_law_1.2,0.5485824108123779
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,16,power_law_1.01,0.09757440090179444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,32,power_law_1.2,0.6271552085876465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,16,power_law_1.01,0.09755520224571228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,32,power_law_1.2,0.9792767524719238
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,16,power_law_1.01,0.10186879634857178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,32,power_law_1.2,1.2846400260925293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,16,power_law_1.2,0.09823359847068787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,16,power_law_1.01,0.10453120470046998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,32,power_law_1.2,1.8791488647460937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,16,power_law_1.2,0.06503679752349853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,16,power_law_1.01,0.11354240179061889
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,8,power_law_1.01,0.07730559706687927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,16,power_law_1.2,0.05932160019874573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,32,power_law_1.2,3.1200639724731447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,16,power_law_1.01,0.11599999666213989
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,8,power_law_1.01,0.0705344021320343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,16,power_law_1.2,0.06343039870262146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,16,power_law_1.01,0.11845760345458985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,8,power_law_1.01,0.05948160290718078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,16,power_law_1.2,0.07058560252189636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,32,power_law_1.2,6.743571472167969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,16,power_law_1.01,0.13340799808502196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,8,power_law_1.01,0.0680895984172821
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,16,power_law_1.2,0.08471680283546448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,16,power_law_1.01,0.15409280061721803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,8,power_law_1.01,0.07628160119056701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,16,power_law_1.2,0.08923519849777221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,16,power_law_1.01,0.1856384038925171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,8,power_law_1.01,0.08611199855804444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,16,power_law_1.2,0.08799359798431397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,16,power_law_1.01,0.20366079807281495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,8,power_law_1.01,0.09143679738044738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,16,power_law_1.2,0.09045119881629944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,16,power_law_1.01,0.2599744081497192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,8,power_law_1.01,0.09123200178146362
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,16,power_law_1.2,0.09147520065307617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,8,power_law_1.01,0.0946943998336792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,16,power_law_1.2,0.09660159945487976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,16,power_law_1.01,0.2972480058670044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,8,power_law_1.01,0.09841279983520508
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,16,power_law_1.2,0.09884160161018371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,16,power_law_1.01,0.3887936115264893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,8,power_law_1.01,0.09901440143585205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,16,power_law_1.2,0.09966080188751221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,16,power_law_1.01,0.5010111808776856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,8,power_law_1.01,0.10412800312042236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,16,power_law_1.2,0.10499839782714844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,16,power_law_1.01,0.7150400161743165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,8,power_law_1.01,0.10720000267028809
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,16,power_law_1.2,0.11155200004577637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,16,power_law_1.01,0.913696002960205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,8,power_law_1.01,0.11265280246734619
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,16,power_law_1.2,0.11707520484924316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,8,power_law_1.2,0.07836160063743591
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,16,power_law_1.01,1.2071680068969726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,8,power_law_1.01,0.12091519832611083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,16,power_law_1.2,0.12446719408035278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,8,power_law_1.2,0.057683199644088745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,16,power_law_1.01,1.9047168731689452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,8,power_law_1.01,0.12541439533233642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,16,power_law_1.2,0.1406399965286255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,8,power_law_1.2,0.05809280276298523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,8,power_law_1.01,0.12602880001068115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,16,power_law_1.2,0.15947519540786742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,8,power_law_1.2,0.06464639902114869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,16,power_law_1.01,3.5506881713867187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,8,power_law_1.01,0.1401535987854004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,16,power_law_1.2,0.18792959451675414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,8,power_law_1.2,0.06977279782295227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,8,power_law_1.01,0.15676159858703614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,16,power_law_1.2,0.22357759475708008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,8,power_law_1.2,0.08390399813652039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,8,power_law_1.01,0.19465600252151488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,16,power_law_1.2,0.28010880947113037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,8,power_law_1.2,0.08777599930763244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,8,power_law_1.01,0.2142848014831543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,16,power_law_1.2,0.3310784101486206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,8,power_law_1.2,0.09208959937095643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,8,power_law_1.2,0.0945472002029419
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,8,power_law_1.01,0.2669503927230835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,16,power_law_1.2,0.4818431854248047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,8,power_law_1.2,0.09740800261497498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,8,power_law_1.01,0.35704960823059084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,16,power_law_1.2,0.7003392219543457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,8,power_law_1.2,0.10354559421539307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,8,power_law_1.01,0.45474557876586913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,16,power_law_1.2,0.9349504470825195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,8,power_law_1.2,0.10520319938659668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,8,power_law_1.01,0.5706495761871337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,16,power_law_1.2,1.0623295783996582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,8,power_law_1.2,0.10970239639282227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,8,power_law_1.01,0.7822080135345459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,16,power_law_1.2,1.5149824142456054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,8,power_law_1.2,0.10639359951019287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,8,power_law_1.01,0.9771648406982422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,16,power_law_1.2,2.5001216888427735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,8,power_law_1.2,0.11871999502182007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,8,power_law_1.01,1.2915519714355468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,8,power_law_1.2,0.12198400497436523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,16,power_law_1.2,5.27496337890625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,8,power_law_1.2,0.12855039834976195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,8,power_law_1.01,1.867647933959961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,4,power_law_1.01,0.06643199920654297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,8,power_law_1.2,0.14370559453964232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,8,power_law_1.01,3.6627262115478514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,4,power_law_1.01,0.06277120113372803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,8,power_law_1.2,0.1742143988609314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,8,power_law_1.2,0.2024768114089966
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,4,power_law_1.01,0.061939197778701785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,8,power_law_1.2,0.23075199127197266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,4,power_law_1.01,0.0693120002746582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,4,power_law_1.01,0.07600640058517456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,8,power_law_1.2,0.2899264097213745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,4,power_law_1.01,0.09707520008087159
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,8,power_law_1.2,0.3708224058151245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,4,power_law_1.01,0.10166399478912354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,8,power_law_1.2,0.5162303924560547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,4,power_law_1.01,0.10453120470046998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,8,power_law_1.2,0.5707136154174804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,4,power_law_1.01,0.10616320371627808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,8,power_law_1.2,0.8223872184753418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,4,power_law_1.01,0.10739840269088745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,8,power_law_1.2,1.2359040260314942
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,4,power_law_1.01,0.11641600131988525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,8,power_law_1.2,1.5502528190612792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,4,power_law_1.01,0.12090879678726196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,8,power_law_1.2,2.324812889099121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,4,power_law_1.01,0.12316800355911255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,4,power_law_1.2,0.0648576021194458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,4,power_law_1.01,0.12316160202026367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,4,power_law_1.2,0.05440000295639038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,8,power_law_1.2,4.208153533935547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,4,power_law_1.01,0.1327936053276062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,4,power_law_1.2,0.058303999900817874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,4,power_law_1.01,0.13749120235443116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,4,power_law_1.2,0.06546559929847717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,4,power_law_1.01,0.13935359716415405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,4,power_law_1.2,0.07326080203056336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,4,power_law_1.01,0.1602112054824829
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,4,power_law_1.2,0.09393919706344604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,4,power_law_1.2,0.09864320158958435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,4,power_law_1.01,0.1758015990257263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,4,power_law_1.2,0.10274560451507568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,4,power_law_1.01,0.21471359729766845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,4,power_law_1.2,0.10602240562438965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,4,power_law_1.01,0.24686079025268554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,2,power_law_1.01,0.063372802734375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,4,power_law_1.2,0.11134079694747925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,2,power_law_1.01,0.06440320014953613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,4,power_law_1.01,0.31198079586029054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,4,power_law_1.2,0.11667200326919555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,2,power_law_1.01,0.06295040249824524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,4,power_law_1.01,0.3943295955657959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,4,power_law_1.2,0.11994240283966065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,2,power_law_1.01,0.0785152018070221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,4,power_law_1.01,0.5145408153533936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,4,power_law_1.2,0.12343039512634277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,2,power_law_1.01,0.08775039911270141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,4,power_law_1.01,0.6552256107330322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,4,power_law_1.2,0.1221951961517334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,2,power_law_1.01,0.11353600025177002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,4,power_law_1.01,0.8981247901916504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,4,power_law_1.2,0.13571200370788575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,2,power_law_1.01,0.12008960247039795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,4,power_law_1.01,1.1096768379211426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,4,power_law_1.2,0.14288640022277832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,2,power_law_1.01,0.12255359888076782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,4,power_law_1.01,1.4598976135253907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,4,power_law_1.2,0.14615679979324342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,2,power_law_1.01,0.12973439693450928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,4,power_law_1.2,0.15864319801330568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,2,power_law_1.01,0.13526400327682495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,4,power_law_1.01,2.2811391830444334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,4,power_law_1.2,0.19489920139312744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,2,power_law_1.01,0.13813120126724243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,4,power_law_1.01,4.132332611083984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,4,power_law_1.2,0.2231679916381836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,2,power_law_1.01,0.14960000514984131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,2,power_law_1.01,0.1571776032447815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,4,power_law_1.2,0.2544895887374878
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,2,power_law_1.2,0.05932160019874573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,2,power_law_1.01,0.1590016007423401
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,4,power_law_1.2,0.3325056076049805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,2,power_law_1.2,0.05809280276298523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,2,power_law_1.01,0.1672127962112427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,4,power_law_1.2,0.4115776062011719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,2,power_law_1.2,0.06669440269470214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,2,power_law_1.01,0.18216320276260375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,2,power_law_1.2,0.07160959839820862
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,4,power_law_1.2,0.5285312175750733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,2,power_law_1.01,0.17663359642028809
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,2,power_law_1.2,0.08102399706840516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,4,power_law_1.2,0.7024064064025879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,2,power_law_1.01,0.21063039302825928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,2,power_law_1.2,0.11521919965744018
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,4,power_law_1.2,1.0720576286315917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,2,power_law_1.01,0.2329472064971924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,2,power_law_1.2,0.12300800085067749
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,4,power_law_1.2,1.264140796661377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,2,power_law_1.01,0.2827071905136108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,2,power_law_1.2,0.12403199672698975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,4,power_law_1.2,1.7263744354248047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,2,power_law_1.2,0.1277184009552002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,2,power_law_1.01,0.32568960189819335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,4,power_law_1.2,2.5984384536743166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,2,power_law_1.2,0.13918720483779906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,2,power_law_1.01,0.40189437866210936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,2,power_law_1.2,0.13752959966659545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,2,power_law_1.01,0.5415679931640625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,4,power_law_1.2,5.05030403137207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,2,power_law_1.2,0.136518394947052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,2,power_law_1.01,0.6966015815734863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,2,power_law_1.2,0.14369920492172242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,2,power_law_1.01,0.8739583969116211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,2,power_law_1.2,0.15230079889297485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,2,power_law_1.01,1.196127986907959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,2,power_law_1.2,0.16049280166625976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,2,power_law_1.01,1.5141632080078125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,2,power_law_1.2,0.16868480443954467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,2,power_law_1.01,1.9203008651733398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,2,power_law_1.2,0.17994879484176635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,2,power_law_1.2,0.21374080181121827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,2,power_law_1.01,2.9930240631103517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,2,power_law_1.2,0.23196160793304443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,2,power_law_1.2,0.2783936023712158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,2,power_law_1.01,5.688800048828125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,2,power_law_1.2,0.33041279315948485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,2,power_law_1.2,0.4506944179534912
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,2,power_law_1.2,0.519923210144043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,2,power_law_1.2,0.7113984107971192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,2,power_law_1.2,0.8744319915771485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,2,power_law_1.2,1.2124159812927247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,2,power_law_1.2,1.5297151565551759
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,2,power_law_1.2,1.9969024658203125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,2,power_law_1.2,3.135148811340332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,1,power_law_1.01,0.05947520136833191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,2,power_law_1.2,6.156768035888672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,1,power_law_1.01,0.06663680076599121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,32,power_law_1.01,0.11007360219955445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,1,power_law_1.01,0.07649279832839966
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,32,power_law_1.01,0.13729920387268066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,1,power_law_1.01,0.09633280038833618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,32,power_law_1.01,0.13198720216751098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,1,power_law_1.01,0.10657919645309448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,32,power_law_1.01,0.07670400142669678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,1,power_law_1.01,0.15082240104675293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,32,power_law_1.01,0.0906175971031189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,1,power_law_1.01,0.158188796043396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,32,power_law_1.01,0.10249600410461426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,1,power_law_1.01,0.16760319471359253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,1,power_law_1.01,0.17785600423812867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,32,power_law_1.01,0.10652799606323242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,1,power_law_1.01,0.18624000549316405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,32,power_law_1.01,0.11273599863052368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,1,power_law_1.01,0.2079551935195923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,32,power_law_1.01,0.11683199405670167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,1,power_law_1.01,0.22083840370178223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,32,power_law_1.01,0.11725440025329589
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,32,power_law_1.2,0.11461759805679321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,1,power_law_1.01,0.22556800842285157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,1,power_law_1.2,0.05911679863929749
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,32,power_law_1.01,0.12400000095367432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,32,power_law_1.2,0.1363136053085327
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,1,power_law_1.01,0.1979200005531311
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,1,power_law_1.2,0.0648576021194458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,32,power_law_1.01,0.13155839443206788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,1,power_law_1.01,0.217574405670166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,1,power_law_1.2,0.07223039865493774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,32,power_law_1.2,0.12524800300598143
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,1,power_law_1.01,0.225164794921875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,1,power_law_1.2,0.09045119881629944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,32,power_law_1.01,0.1319808006286621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,32,power_law_1.2,0.08021119832992554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,1,power_law_1.01,0.2466559886932373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,1,power_law_1.2,0.10540159940719604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,32,power_law_1.01,0.1418176054954529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,32,power_law_1.2,0.08431360125541687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,1,power_law_1.2,0.15005439519882202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,1,power_law_1.01,0.29397120475769045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,32,power_law_1.01,0.1524672031402588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,32,power_law_1.2,0.10110080242156982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,1,power_law_1.2,0.15926400423049927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,1,power_law_1.01,0.326911997795105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,32,power_law_1.01,0.1536960005760193
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,32,power_law_1.2,0.1035647988319397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,1,power_law_1.2,0.17340799570083618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,1,power_law_1.01,0.4037439823150635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,32,power_law_1.01,0.16393599510192872
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,1,power_law_1.2,0.18261120319366456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,32,power_law_1.2,0.11541759967803955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,1,power_law_1.01,0.485427188873291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,1,power_law_1.2,0.19325439929962157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,32,power_law_1.01,0.1954751968383789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,1,power_law_1.01,0.6267648220062256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,32,power_law_1.2,0.12136319875717164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,1,power_law_1.2,0.20801920890808107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,32,power_law_1.01,0.19303040504455565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,1,power_law_1.01,0.7936768054962158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,32,power_law_1.2,0.1252671957015991
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,1,power_law_1.2,0.22685439586639405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,1,power_law_1.01,1.0328960418701172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,32,power_law_1.01,0.22167038917541504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,32,power_law_1.2,0.1250432014465332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,1,power_law_1.2,0.22931840419769287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,1,power_law_1.01,1.2600128173828125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,32,power_law_1.01,0.24380800724029542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,1,power_law_1.2,0.21088640689849852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,32,power_law_1.2,0.12772480249404908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,1,power_law_1.01,1.7550016403198243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,1,power_law_1.2,0.22235519886016847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,32,power_law_1.01,0.3222208023071289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,32,power_law_1.2,0.12955520153045655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,1,power_law_1.2,0.23135359287261964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,1,power_law_1.01,2.269286346435547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,32,power_law_1.01,0.3881727933883667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,32,power_law_1.2,0.13078399896621704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,1,power_law_1.2,0.25019519329071044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,1,power_law_1.01,2.772659111022949
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,32,power_law_1.01,0.5260223865509033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,32,power_law_1.2,0.1525056004524231
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,1,power_law_1.2,0.2983232021331787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,32,power_law_1.01,0.6128575801849365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,32,power_law_1.2,0.15147520303726197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,1,power_law_1.2,0.325766396522522
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,1,power_law_1.01,4.276505661010742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,1,power_law_1.2,0.405836820602417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,32,power_law_1.2,0.1654080033302307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,32,power_law_1.01,0.8493696212768554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,1,power_law_1.01,8.347071838378906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,1,power_law_1.2,0.48427519798278806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,32,power_law_1.2,0.187116801738739
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,32,power_law_1.01,1.1158464431762696
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,1,power_law_1.2,0.6264063835144043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,32,power_law_1.2,0.19939839839935303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,32,power_law_1.01,1.3120256423950196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,1,power_law_1.2,0.7941247940063476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,32,power_law_1.2,0.2407680034637451
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,1,power_law_1.2,1.0444160461425782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,32,power_law_1.01,1.9960575103759766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,32,power_law_1.2,0.27825279235839845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,1,power_law_1.2,1.2711168289184571
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,32,power_law_1.01,4.022521591186523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,32,power_law_1.2,0.36664319038391113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,1,power_law_1.2,1.7624448776245116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,1,power_law_1.2,2.2766847610473633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,32,power_law_1.2,0.3931391954421997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,1,power_law_1.2,2.798931121826172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,32,power_law_1.2,0.5370240211486816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,32,power_law_1.2,0.6868351936340332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,1,power_law_1.2,4.294169616699219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,32,power_law_1.2,0.9522047996520996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,1,power_law_1.2,8.365593719482423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,16,power_law_1.01,0.0967423975467682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,32,power_law_1.2,1.2801024436950683
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,16,power_law_1.01,0.11415040493011475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,32,power_law_1.2,1.6247808456420898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,16,power_law_1.01,0.14036480188369752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,32,power_law_1.2,2.4874240875244142
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,16,power_law_1.01,0.06725760102272034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,16,power_law_1.01,0.0840511977672577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,32,power_law_1.2,5.3216510772705075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,16,power_law_1.2,0.09573760032653808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,16,power_law_1.01,0.09408640265464782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,16,power_law_1.2,0.11478400230407715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,16,power_law_1.01,0.10615040063858032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,16,power_law_1.2,0.09123200178146362
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,16,power_law_1.01,0.12337919473648071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,16,power_law_1.2,0.07197440266609192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,16,power_law_1.01,0.11886719465255738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,16,power_law_1.2,0.08181120157241821
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,16,power_law_1.2,0.09430400133132935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,16,power_law_1.01,0.1213312029838562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,16,power_law_1.2,0.10085760354995728
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,16,power_law_1.01,0.12521599531173705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,8,power_law_1.01,0.07489280104637146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,16,power_law_1.2,0.11724159717559815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,8,power_law_1.01,0.0908735990524292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,16,power_law_1.01,0.13033599853515626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,16,power_law_1.2,0.11763839721679688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,8,power_law_1.01,0.12199679613113404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,16,power_law_1.01,0.13034240007400513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,8,power_law_1.01,0.06812800168991089
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,16,power_law_1.2,0.11929600238800049
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,16,power_law_1.01,0.1395583987236023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,8,power_law_1.01,0.07694079875946044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,16,power_law_1.2,0.1268671989440918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,16,power_law_1.01,0.14527360200881959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,8,power_law_1.2,0.07406719923019409
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,8,power_law_1.01,0.096806401014328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,16,power_law_1.2,0.12113280296325683
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,16,power_law_1.01,0.14057600498199463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,8,power_law_1.2,0.09188479781150818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,8,power_law_1.01,0.10764800310134888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,16,power_law_1.2,0.13239680528640746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,16,power_law_1.01,0.15306880474090576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,8,power_law_1.2,0.07445120215415954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,8,power_law_1.01,0.12199679613113404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,16,power_law_1.2,0.1332159996032715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,16,power_law_1.01,0.17538559436798096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,8,power_law_1.2,0.0673088014125824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,8,power_law_1.01,0.12240639925003052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,16,power_law_1.2,0.14611200094223023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,16,power_law_1.01,0.18645119667053223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,8,power_law_1.2,0.07712640166282654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,8,power_law_1.01,0.12874879837036132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,16,power_law_1.2,0.1565567970275879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,16,power_law_1.01,0.21573760509490966
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,8,power_law_1.2,0.09249920248985291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,8,power_law_1.01,0.12383359670639038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,16,power_law_1.2,0.16046080589294434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,16,power_law_1.01,0.2544384002685547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,8,power_law_1.2,0.10314879417419434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,8,power_law_1.01,0.13407360315322875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,16,power_law_1.2,0.18297599554061889
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,16,power_law_1.01,0.31546878814697266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,16,power_law_1.2,0.19445120096206664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,8,power_law_1.01,0.14022400379180908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,8,power_law_1.2,0.11912959814071655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,16,power_law_1.01,0.38224639892578127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,16,power_law_1.2,0.24688000679016114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,8,power_law_1.01,0.14451199769973755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,8,power_law_1.2,0.11971839666366577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,16,power_law_1.01,0.5141312122344971
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,8,power_law_1.01,0.151910400390625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,16,power_law_1.2,0.2677695989608765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,8,power_law_1.2,0.1211583971977234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,16,power_law_1.01,0.6103936195373535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,8,power_law_1.01,0.15763200521469117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,16,power_law_1.2,0.32613120079040525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,8,power_law_1.2,0.1312000036239624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,16,power_law_1.01,0.8559488296508789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,8,power_law_1.01,0.163372802734375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,16,power_law_1.2,0.40064001083374023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,8,power_law_1.2,0.13304320573806763
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,16,power_law_1.01,1.0851136207580567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,16,power_law_1.2,0.5137216091156006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,8,power_law_1.01,0.1891584038734436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,8,power_law_1.2,0.13980799913406372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,16,power_law_1.01,1.3116095542907715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,8,power_law_1.01,0.20166399478912353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,16,power_law_1.2,0.6720320224761963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,8,power_law_1.2,0.1465664029121399
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,16,power_law_1.01,1.9251903533935546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,8,power_law_1.01,0.24158720970153807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,16,power_law_1.2,0.9472960472106934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,8,power_law_1.2,0.15086719989776612
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,8,power_law_1.01,0.26187520027160643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,8,power_law_1.2,0.15741440057754516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,16,power_law_1.01,4.0348350524902346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,16,power_law_1.2,1.1920127868652344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,8,power_law_1.01,0.3464639902114868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,8,power_law_1.2,0.16725120544433594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,16,power_law_1.2,1.420582389831543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,8,power_law_1.01,0.40830078125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,8,power_law_1.2,0.19448959827423096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,16,power_law_1.2,2.2328128814697266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,8,power_law_1.01,0.5428671836853027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,8,power_law_1.2,0.20760319232940674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,8,power_law_1.01,0.6786431789398193
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,16,power_law_1.2,4.812652969360352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,8,power_law_1.2,0.24807679653167725
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,8,power_law_1.01,0.8895744323730469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,8,power_law_1.2,0.285427188873291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,8,power_law_1.01,1.1838848114013671
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,8,power_law_1.2,0.34971520900726316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,8,power_law_1.2,0.43104000091552735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,8,power_law_1.01,1.4374272346496582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,8,power_law_1.2,0.5944575786590576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,8,power_law_1.01,2.211993598937988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,8,power_law_1.2,0.7621888160705567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,8,power_law_1.01,4.247884750366211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,8,power_law_1.2,0.9775744438171386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,8,power_law_1.2,1.2886719703674316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,8,power_law_1.2,1.497817611694336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,4,power_law_1.01,0.06930559873580933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,8,power_law_1.2,2.5115711212158205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,4,power_law_1.01,0.07462400197982788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,4,power_law_1.01,0.1033087968826294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,8,power_law_1.2,4.6662849426269535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,4,power_law_1.01,0.07463679909706115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,4,power_law_1.01,0.088755202293396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,4,power_law_1.2,0.07177600264549255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,4,power_law_1.2,0.08200960159301758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,4,power_law_1.01,0.11107840538024902
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,4,power_law_1.2,0.07464320063591004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,4,power_law_1.01,0.1194815993309021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,4,power_law_1.2,0.06931840181350708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,4,power_law_1.01,0.1344256043434143
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,4,power_law_1.2,0.08323839902877808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,4,power_law_1.01,0.14309760332107543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,4,power_law_1.2,0.10230400562286376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,4,power_law_1.01,0.15083520412445067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,4,power_law_1.2,0.1139456033706665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,4,power_law_1.01,0.15081599950790406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,4,power_law_1.2,0.13567999601364136
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,4,power_law_1.01,0.1545024037361145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,4,power_law_1.2,0.14058239459991456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,4,power_law_1.01,0.15982719659805297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,4,power_law_1.2,0.14202239513397216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,4,power_law_1.01,0.16842880249023437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,4,power_law_1.2,0.15408639907836913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,4,power_law_1.01,0.17969919443130494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,4,power_law_1.2,0.15820159912109374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,4,power_law_1.01,0.18542720079421998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,2,power_law_1.01,0.06464639902114869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,4,power_law_1.2,0.16268800497055053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,4,power_law_1.01,0.19544960260391236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,2,power_law_1.01,0.07059199810028076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,4,power_law_1.2,0.16844160556793214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,4,power_law_1.01,0.21552000045776368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,2,power_law_1.01,0.08469759821891784
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,4,power_law_1.2,0.17662080526351928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,4,power_law_1.01,0.2395008087158203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,2,power_law_1.01,0.07857279777526856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,4,power_law_1.2,0.1866688013076782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,2,power_law_1.01,0.10724480152130127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,4,power_law_1.01,0.28782079219818113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,4,power_law_1.2,0.19957120418548585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,2,power_law_1.01,0.12874239683151245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,4,power_law_1.01,0.32222719192504884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,2,power_law_1.2,0.0642304003238678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,4,power_law_1.2,0.22230401039123535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,2,power_law_1.01,0.14370559453964232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,4,power_law_1.01,0.4060031890869141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,2,power_law_1.2,0.07262719869613647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,4,power_law_1.2,0.24483199119567872
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,2,power_law_1.01,0.18176640272140504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,4,power_law_1.01,0.4830016136169434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,2,power_law_1.2,0.08102399706840516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,4,power_law_1.2,0.2935551881790161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,2,power_law_1.01,0.1934399962425232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,4,power_law_1.01,0.6372159957885742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,2,power_law_1.2,0.07939199805259704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,2,power_law_1.01,0.19203200340270996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,4,power_law_1.2,0.3367743968963623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,2,power_law_1.2,0.09659519791603088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,4,power_law_1.01,0.805561637878418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,2,power_law_1.01,0.19304959774017333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,4,power_law_1.2,0.4301760196685791
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,2,power_law_1.2,0.12034560441970825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,4,power_law_1.01,1.096992015838623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,2,power_law_1.01,0.2030911922454834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,4,power_law_1.2,0.5280704021453857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,2,power_law_1.2,0.14206080436706542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,4,power_law_1.01,1.4209856033325194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,2,power_law_1.01,0.2096384048461914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,4,power_law_1.2,0.6728511810302734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,2,power_law_1.2,0.1694975972175598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,4,power_law_1.01,1.698080062866211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,2,power_law_1.01,0.21619200706481934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,4,power_law_1.2,0.8600383758544922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,2,power_law_1.2,0.18487679958343506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,4,power_law_1.01,2.605721664428711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,2,power_law_1.01,0.23094398975372316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,2,power_law_1.2,0.19797120094299317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,4,power_law_1.2,1.1936575889587402
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,2,power_law_1.01,0.2381119966506958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,2,power_law_1.2,0.1965440034866333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,4,power_law_1.2,1.4792896270751954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,4,power_law_1.01,4.90975341796875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,2,power_law_1.01,0.2563456058502197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,2,power_law_1.2,0.21944959163665773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,4,power_law_1.2,1.7955583572387694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,2,power_law_1.01,0.2856384038925171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,2,power_law_1.2,0.23379840850830078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,4,power_law_1.2,2.741535949707031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,2,power_law_1.01,0.31655681133270264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,2,power_law_1.2,0.24855680465698243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,2,power_law_1.01,0.38699519634246826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,2,power_law_1.2,0.2641216039657593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,4,power_law_1.2,5.508383941650391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,2,power_law_1.01,0.4318592071533203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,2,power_law_1.2,0.27497599124908445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,2,power_law_1.01,0.5473728179931641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,2,power_law_1.2,0.25715200901031493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,2,power_law_1.01,0.6745535850524902
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,2,power_law_1.2,0.28501119613647463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,2,power_law_1.01,0.871987247467041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,2,power_law_1.2,0.32515840530395507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,2,power_law_1.01,1.1105536460876464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,2,power_law_1.2,0.385318398475647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,2,power_law_1.2,0.44167680740356446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,2,power_law_1.01,1.5108736038208008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,2,power_law_1.2,0.5522687911987305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,2,power_law_1.01,1.8861375808715821
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,2,power_law_1.2,0.7019775867462158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,2,power_law_1.01,2.2566400527954102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,2,power_law_1.2,0.885478401184082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,2,power_law_1.01,3.427872085571289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,2,power_law_1.2,1.1260671615600586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,2,power_law_1.01,7.083757019042968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,2,power_law_1.2,1.5604351997375487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,2,power_law_1.2,1.9661056518554687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,2,power_law_1.2,2.335865592956543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,4,8,power_law_1.01,0.020006400346755982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,4,8,power_law_1.01,0.019174399971961974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,2,power_law_1.2,3.549113464355469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,4,8,power_law_1.01,0.01959040015935898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,4,8,power_law_1.01,0.019603200256824493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,2,power_law_1.2,6.708351898193359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,4,8,power_law_1.01,0.020819200575351714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,4,8,power_law_1.01,0.023078399896621703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,4,8,power_law_1.01,0.022681599855422972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,4,8,power_law_1.01,0.025740799307823182
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,4,8,power_law_1.01,0.024512000381946564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,4,8,power_law_1.2,0.019174399971961974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,4,8,power_law_1.01,0.0253248006105423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,4,8,power_law_1.2,0.019776000082492827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,4,8,power_law_1.01,0.027993598580360414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,4,8,power_law_1.2,0.01958400011062622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,4,8,power_law_1.01,0.03188480138778686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,4,8,power_law_1.2,0.019993600249290467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,4,8,power_law_1.01,0.03761279881000519
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,4,8,power_law_1.2,0.020608000457286835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,4,8,power_law_1.01,0.03720319867134094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,4,8,power_law_1.2,0.024294400215148927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,4,8,power_law_1.01,0.040889599919319154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,4,8,power_law_1.2,0.02428800016641617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,4,8,power_law_1.01,0.04519680142402649
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,4,8,power_law_1.2,0.026144000887870788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,4,8,power_law_1.01,0.05011199712753296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,4,8,power_law_1.2,0.024505600333213806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,4,8,power_law_1.01,0.06423680186271667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,4,8,power_law_1.2,0.026150399446487428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,4,8,power_law_1.01,0.07283200025558471
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,4,8,power_law_1.2,0.027775999903678895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,1,power_law_1.01,0.06909440159797668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,4,8,power_law_1.01,0.1078719973564148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,4,8,power_law_1.2,0.03454079926013946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,4,8,power_law_1.01,0.1285375952720642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,1,power_law_1.01,0.07668480277061462
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,4,8,power_law_1.2,0.03821440041065216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,4,8,power_law_1.01,0.2061568021774292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,4,8,power_law_1.2,0.03639039993286133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,1,power_law_1.01,0.08691840171813965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,4,8,power_law_1.01,0.2571647882461548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,4,8,power_law_1.2,0.040678399801254275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,4,8,power_law_1.01,0.3857728004455566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,1,power_law_1.01,0.09941120147705078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,4,8,power_law_1.2,0.04785279929637909
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,4,8,power_law_1.01,0.4160768032073975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,1,power_law_1.2,0.06889600157737732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,4,8,power_law_1.2,0.04907520115375519
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,1,power_law_1.01,0.13852159976959227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,4,8,power_law_1.01,0.7195968151092529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,4,8,power_law_1.2,0.06543999910354614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,1,power_law_1.2,0.07566720247268677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,1,power_law_1.01,0.17744640111923218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,4,8,power_law_1.01,1.0132800102233888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,4,8,power_law_1.2,0.07918720245361328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,1,power_law_1.2,0.08447359800338745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,4,8,power_law_1.01,1.1736255645751954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,4,8,power_law_1.2,0.11072640419006348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,1,power_law_1.01,0.20775680541992186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,1,power_law_1.2,0.10658559799194336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,4,8,power_law_1.2,0.14307839870452882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,4,8,power_law_1.01,1.9199232101440429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,1,power_law_1.01,0.25321600437164304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,4,8,power_law_1.2,0.19857280254364013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,1,power_law_1.2,0.12707200050354003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,4,8,power_law_1.01,3.871673583984375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,1,power_law_1.01,0.26528639793395997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,4,8,power_law_1.2,0.26165759563446045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,1,power_law_1.2,0.17375999689102173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,4,8,power_law_1.2,0.3882240056991577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,1,power_law_1.01,0.2798271894454956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,1,power_law_1.2,0.19753600358963014
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,4,8,power_law_1.2,0.5178624153137207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,4,8,power_law_1.01,0.038841599225997926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,1,power_law_1.01,0.3111743927001953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,4,8,power_law_1.2,0.7212287902832031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,4,8,power_law_1.01,0.04069119989871979
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,1,power_law_1.2,0.26407039165496826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,1,power_law_1.01,0.3392319917678833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,4,8,power_law_1.2,1.0120320320129395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,4,8,power_law_1.01,0.038848000764846805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,1,power_law_1.2,0.26857600212097166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,4,8,power_law_1.2,1.2190848350524903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,4,8,power_law_1.01,0.038848000764846805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,1,power_law_1.01,0.3334719896316528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,1,power_law_1.2,0.2935551881790161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,4,8,power_law_1.01,0.039052799344062805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,4,8,power_law_1.2,1.9977472305297852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,1,power_law_1.01,0.3480384111404419
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,4,8,power_law_1.01,0.039673599600791934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,1,power_law_1.2,0.27882239818572996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,4,8,power_law_1.2,3.8933761596679686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,4,8,power_law_1.01,0.040064001083374025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,1,power_law_1.01,0.3928832054138184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,1,power_law_1.2,0.29602560997009275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,4,8,power_law_1.01,0.04048640131950378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,1,power_law_1.01,0.4432703971862793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,4,8,power_law_1.01,0.03985919952392578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,1,power_law_1.2,0.31240320205688477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,4,8,power_law_1.2,0.038022398948669434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,1,power_law_1.01,0.4797247886657715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,4,8,power_law_1.01,0.04089600145816803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,1,power_law_1.2,0.32614400386810305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,4,8,power_law_1.2,0.040064001083374025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,4,8,power_law_1.01,0.04232960045337677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,1,power_law_1.01,0.5628672122955323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,4,8,power_law_1.2,0.03802880048751831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,1,power_law_1.2,0.3390271902084351
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,4,8,power_law_1.01,0.04581120014190674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,4,8,power_law_1.2,0.03841919898986816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,4,8,power_law_1.01,0.04601599872112274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,1,power_law_1.01,0.4805312156677246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,1,power_law_1.2,0.35011839866638184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,4,8,power_law_1.2,0.03863680064678192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,4,8,power_law_1.01,0.04785920083522797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,1,power_law_1.01,0.5808896064758301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,1,power_law_1.2,0.37569921016693114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,4,8,power_law_1.2,0.038822400569915774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,4,8,power_law_1.01,0.053388798236846925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,4,8,power_law_1.2,0.039654400944709775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,4,8,power_law_1.01,0.0581055998802185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,1,power_law_1.2,0.4432703971862793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,1,power_law_1.01,0.6679232120513916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,4,8,power_law_1.2,0.04089600145816803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,4,8,power_law_1.01,0.061363202333450315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,1,power_law_1.2,0.48874239921569823
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,1,power_law_1.01,0.8440640449523926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,4,8,power_law_1.2,0.042508798837661746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,4,8,power_law_1.01,0.070387202501297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,1,power_law_1.2,0.5948224067687988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,4,8,power_law_1.01,0.07305600047111512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,4,8,power_law_1.2,0.04211840033531189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,1,power_law_1.01,1.0369728088378907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,4,8,power_law_1.01,0.0877951979637146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,4,8,power_law_1.2,0.04170880019664765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,1,power_law_1.2,0.6712255954742432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,1,power_law_1.01,1.3370047569274903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,4,8,power_law_1.01,0.10806399583816528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,4,8,power_law_1.2,0.04519039988517761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,1,power_law_1.2,0.8491968154907227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,4,8,power_law_1.2,0.04560000002384186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,4,8,power_law_1.01,0.14431359767913818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,1,power_law_1.01,1.7382080078125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,4,8,power_law_1.2,0.04785920083522797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,4,8,power_law_1.01,0.1637760043144226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,1,power_law_1.2,1.0545984268188477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,1,power_law_1.01,2.340345573425293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,4,8,power_law_1.2,0.05236480236053467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,4,8,power_law_1.01,0.23748478889465333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,1,power_law_1.2,1.3648703575134278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,4,8,power_law_1.2,0.05604479908943176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,4,8,power_law_1.01,0.2749696016311646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,1,power_law_1.01,2.8734079360961915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,4,8,power_law_1.2,0.06117119789123535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,4,8,power_law_1.01,0.4429056167602539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,1,power_law_1.2,1.788198471069336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,4,8,power_law_1.2,0.07160959839820862
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,1,power_law_1.01,3.4708160400390624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,4,8,power_law_1.01,0.5436736106872558
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,1,power_law_1.2,2.379238319396973
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,4,8,power_law_1.2,0.07447680234909057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,4,8,power_law_1.01,0.7044352054595947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,4,8,power_law_1.2,0.08962560296058655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,1,power_law_1.01,5.369120025634766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,1,power_law_1.2,2.8807872772216796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,4,8,power_law_1.01,1.1011391639709474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,4,8,power_law_1.2,0.10885119438171387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,4,8,power_law_1.01,2.471455955505371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,1,power_law_1.2,3.5109630584716798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,4,8,power_law_1.2,0.14163199663162232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,1,power_law_1.01,10.184166717529298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,4,8,power_law_1.2,0.17032320499420167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,1,power_law_1.2,5.3957374572753904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,4,8,power_law_1.2,0.24158079624176027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,4,8,power_law_1.2,0.26370561122894287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,8,4,power_law_1.01,0.018361599743366243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,4,8,power_law_1.2,0.4392127990722656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,8,4,power_law_1.2,0.019334399700164796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,1,power_law_1.2,10.196466827392578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,8,4,power_law_1.01,0.019392000138759614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,4,8,power_law_1.2,0.5563648223876954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,8,4,power_law_1.2,0.018918399512767792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,8,4,power_law_1.01,0.018361599743366243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,4,8,power_law_1.2,0.6716671943664551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,8,4,power_law_1.2,0.01892479956150055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,8,4,power_law_1.01,0.01897599995136261
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,8,4,power_law_1.2,0.01913599967956543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,8,4,power_law_1.01,0.01959040015935898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,4,8,power_law_1.2,1.1019455909729003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,8,4,power_law_1.01,0.04371199905872345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,8,4,power_law_1.2,0.020127999782562255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,8,4,power_law_1.01,0.02184319943189621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,8,4,power_law_1.01,0.041875201463699344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,4,8,power_law_1.2,2.4460479736328127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,8,4,power_law_1.2,0.02383359968662262
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,8,4,power_law_1.01,0.0216511994600296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,8,4,power_law_1.01,0.03961600065231323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,8,4,power_law_1.2,0.02096640020608902
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,8,4,power_law_1.01,0.023680000007152556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,8,4,power_law_1.01,0.03920640051364899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,8,4,power_law_1.01,0.022668799757957457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,8,4,power_law_1.2,0.024249599874019624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,8,4,power_law_1.01,0.04127359986305237
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,8,4,power_law_1.2,0.04293760061264038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,8,4,power_law_1.01,0.04023039937019348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,8,4,power_law_1.01,0.023686400055885314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,8,4,power_law_1.2,0.02343039959669113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,8,4,power_law_1.2,0.03761920034885406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,8,4,power_law_1.01,0.0406464010477066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,8,4,power_law_1.01,0.02573440074920654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,8,4,power_law_1.2,0.024249599874019624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,8,4,power_law_1.2,0.038431999087333676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,8,4,power_law_1.01,0.03980799913406372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,8,4,power_law_1.01,0.029420799016952513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,8,4,power_law_1.2,0.030771198868751525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,8,4,power_law_1.2,0.03781760036945343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,8,4,power_law_1.01,0.04023680090904236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,8,4,power_law_1.01,0.0310591995716095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,8,4,power_law_1.2,0.02937600016593933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,8,4,power_law_1.2,0.03966720104217529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,8,4,power_law_1.01,0.04105600118637085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,8,4,power_law_1.01,0.03250559866428375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,8,4,power_law_1.2,0.028339201211929323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,8,4,power_law_1.2,0.040275201201438904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,8,4,power_law_1.01,0.04104959964752197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,8,4,power_law_1.01,0.03925119936466217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,8,4,power_law_1.2,0.0344895988702774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,8,4,power_law_1.2,0.04007039964199066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,8,4,power_law_1.01,0.044736000895500186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,8,4,power_law_1.01,0.03783040046691895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,8,4,power_law_1.2,0.03815680146217346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,8,4,power_law_1.2,0.03966079950332642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,8,4,power_law_1.01,0.044121599197387694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,8,4,power_law_1.01,0.04498560130596161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,8,4,power_law_1.2,0.04023039937019348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,8,4,power_law_1.2,0.03842560052871704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,8,4,power_law_1.01,0.04596480131149292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,8,4,power_law_1.01,0.054816001653671266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,8,4,power_law_1.2,0.04429439902305603
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,8,4,power_law_1.2,0.040479999780654904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,8,4,power_law_1.01,0.052908802032470705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,8,4,power_law_1.01,0.05726079940795899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,8,4,power_law_1.2,0.05128960013389587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,8,4,power_law_1.2,0.0404992014169693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,8,4,power_law_1.01,0.05457280278205871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,8,4,power_law_1.01,0.07591040134429931
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,8,4,power_law_1.2,0.06377599835395813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,8,4,power_law_1.01,0.059494400024414064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,8,4,power_law_1.2,0.04191359877586365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,8,4,power_law_1.01,0.10703359842300415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,8,4,power_law_1.2,0.09080320000648498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,8,4,power_law_1.01,0.06829439997673034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,8,4,power_law_1.2,0.04273279905319214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,8,4,power_law_1.01,0.146560001373291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,8,4,power_law_1.2,0.10513919591903687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,8,4,power_law_1.01,0.07300480008125305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,8,4,power_law_1.2,0.045772799849510194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,8,4,power_law_1.01,0.18138240575790404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,8,4,power_law_1.2,0.17375359535217286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,8,4,power_law_1.01,0.091430401802063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,8,4,power_law_1.2,0.051948797702789304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,8,4,power_law_1.01,0.2760063886642456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,8,4,power_law_1.2,0.2112191915512085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,8,4,power_law_1.01,0.10243200063705445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,8,4,power_law_1.2,0.05605120062828064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,8,4,power_law_1.01,0.3579200029373169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,8,4,power_law_1.2,0.29948160648345945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,8,4,power_law_1.01,0.12747520208358765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,8,4,power_law_1.2,0.05850239992141724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,8,4,power_law_1.01,0.5772607803344727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,8,4,power_law_1.2,0.4395711898803711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,8,4,power_law_1.01,0.16168320178985596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,8,4,power_law_1.2,0.07098879814147949
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,8,4,power_law_1.01,0.7224639892578125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,8,4,power_law_1.2,0.6486783981323242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,8,4,power_law_1.01,0.21902720928192138
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,8,4,power_law_1.2,0.08102399706840516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,8,4,power_law_1.01,1.0798144340515137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,8,4,power_law_1.2,0.7490303993225098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,8,4,power_law_1.01,0.30769920349121094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,8,4,power_law_1.2,0.09189119935035706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,8,4,power_law_1.2,0.9616255760192871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,8,4,power_law_1.01,1.3600000381469726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,8,4,power_law_1.01,0.38264319896697996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,8,4,power_law_1.2,0.10867199897766114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,8,4,power_law_1.01,0.5391104221343994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,8,4,power_law_1.2,1.5469247817993164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,8,4,power_law_1.2,0.13952640295028687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,8,4,power_law_1.01,3.2820480346679686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,8,4,power_law_1.01,0.7453504085540772
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,8,4,power_law_1.2,0.1709247946739197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,8,4,power_law_1.2,3.2439041137695312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,8,4,power_law_1.2,0.22439041137695312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,8,4,power_law_1.01,0.9927424430847168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,8,4,power_law_1.2,0.322271990776062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,8,4,power_law_1.01,2.4984384536743165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,8,4,power_law_1.2,0.44371838569641114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,16,2,power_law_1.01,0.017951999604701997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,8,4,power_law_1.2,0.5178624153137207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,16,2,power_law_1.01,0.01775359958410263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,16,2,power_law_1.2,0.01873279958963394
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,8,4,power_law_1.2,0.6774015903472901
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,16,2,power_law_1.01,0.018367999792099
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,16,2,power_law_1.2,0.017894400656223296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,16,2,power_law_1.01,0.040243199467658995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,16,2,power_law_1.01,0.018566399812698364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,8,4,power_law_1.2,1.1715968132019043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,16,2,power_law_1.01,0.04023039937019348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,16,2,power_law_1.2,0.01831679940223694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,16,2,power_law_1.01,0.019603200256824493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,16,2,power_law_1.01,0.03919999897480011
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,16,2,power_law_1.2,0.01910399943590164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,8,4,power_law_1.2,2.642655944824219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,16,2,power_law_1.01,0.021241599321365358
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,16,2,power_law_1.01,0.04023680090904236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,16,2,power_law_1.2,0.021792000532150267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,16,2,power_law_1.01,0.022675199806690215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,16,2,power_law_1.01,0.041875201463699344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,16,2,power_law_1.2,0.022195200622081756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,16,2,power_law_1.01,0.023078399896621703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,16,2,power_law_1.01,0.04147199988365173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,16,2,power_law_1.2,0.02260479927062988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,16,2,power_law_1.2,0.0367680013179779
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,16,2,power_law_1.01,0.023904000222682954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,16,2,power_law_1.01,0.04104959964752197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,16,2,power_law_1.2,0.023014399409294128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,16,2,power_law_1.2,0.03781760036945343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,16,2,power_law_1.01,0.024716800451278685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,16,2,power_law_1.01,0.041254401206970215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,16,2,power_law_1.2,0.024460799992084503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,16,2,power_law_1.2,0.038022398948669434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,16,2,power_law_1.01,0.025337600708007814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,16,2,power_law_1.01,0.042259201407432556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,16,2,power_law_1.2,0.025062400102615356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,16,2,power_law_1.2,0.038841599225997926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,16,2,power_law_1.01,0.029017600417137145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,16,2,power_law_1.01,0.0430976003408432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,16,2,power_law_1.2,0.025472000241279602
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,16,2,power_law_1.2,0.03864319920539856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,16,2,power_law_1.01,0.029017600417137145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,16,2,power_law_1.01,0.044121599197387694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,16,2,power_law_1.2,0.031007999181747438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,16,2,power_law_1.2,0.040678399801254275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,16,2,power_law_1.01,0.02900480031967163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,16,2,power_law_1.01,0.04575999975204468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,16,2,power_law_1.2,0.030803200602531434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,16,2,power_law_1.01,0.03187200129032135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,16,2,power_law_1.2,0.040678399801254275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,16,2,power_law_1.01,0.04597119987010956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,16,2,power_law_1.2,0.028748801350593566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,16,2,power_law_1.01,0.03802880048751831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,16,2,power_law_1.2,0.03985919952392578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,16,2,power_law_1.01,0.046988800168037415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,16,2,power_law_1.2,0.03407360017299652
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,16,2,power_law_1.01,0.040479999780654904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,16,2,power_law_1.2,0.04108799993991852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,16,2,power_law_1.01,0.05457280278205871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,16,2,power_law_1.2,0.03858560025691986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,16,2,power_law_1.01,0.047040000557899475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,16,2,power_law_1.01,0.05763840079307556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,16,2,power_law_1.2,0.04252800047397613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,16,2,power_law_1.2,0.03898240029811859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,16,2,power_law_1.01,0.05235199928283692
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,16,2,power_law_1.01,0.05989120006561279
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,16,2,power_law_1.2,0.04293760061264038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,16,2,power_law_1.2,0.04535680115222931
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,16,2,power_law_1.01,0.07448319792747497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,16,2,power_law_1.01,0.06870399713516236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,16,2,power_law_1.2,0.04478079974651337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,16,2,power_law_1.2,0.052095997333526614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,16,2,power_law_1.01,0.07628160119056701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,16,2,power_law_1.2,0.04620159864425659
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,16,2,power_law_1.2,0.06849279999732971
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,16,2,power_law_1.01,0.09245439767837524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,16,2,power_law_1.2,0.04580479860305786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,16,2,power_law_1.01,0.0996288001537323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,16,2,power_law_1.2,0.07912960052490234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,16,2,power_law_1.2,0.0527616024017334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,16,2,power_law_1.01,0.12830079793930055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,16,2,power_law_1.2,0.12215039730072022
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,16,2,power_law_1.2,0.05644800066947937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,16,2,power_law_1.01,0.15943039655685426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,16,2,power_law_1.2,0.05788800120353699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,16,2,power_law_1.2,0.13236479759216307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,16,2,power_law_1.01,0.21962239742279052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,16,2,power_law_1.2,0.06832640171051026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,16,2,power_law_1.2,0.19587199687957763
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,16,2,power_law_1.01,0.29356160163879397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,16,2,power_law_1.2,0.07201279997825623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,16,2,power_law_1.2,0.27575039863586426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,16,2,power_law_1.01,0.3822335958480835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,16,2,power_law_1.2,0.08963199853897094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,16,2,power_law_1.2,0.3924799919128418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,16,2,power_law_1.01,0.5206975936889648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,16,2,power_law_1.2,0.10682879686355591
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,16,2,power_law_1.2,0.5194431781768799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,16,2,power_law_1.2,0.14819200038909913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,16,2,power_law_1.01,0.6284095764160156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,16,2,power_law_1.2,0.5821119785308838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,16,2,power_law_1.2,0.1654080033302307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,16,2,power_law_1.01,1.0062591552734375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,16,2,power_law_1.2,0.9296575546264648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,16,2,power_law_1.2,0.21783039569854737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,16,2,power_law_1.01,2.047667121887207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,16,2,power_law_1.2,2.108902359008789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,16,2,power_law_1.2,0.2759871959686279
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,16,2,power_law_1.2,0.35422720909118655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,16,2,power_law_1.2,0.5944575786590576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,16,2,power_law_1.2,0.6347968101501464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,16,2,power_law_1.2,1.1048128128051757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,4,8,power_law_1.01,0.021798400580883025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,4,8,power_law_1.2,0.021382400393486024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,16,2,power_law_1.2,2.086227226257324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,4,8,power_law_1.01,0.022623999416828154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,4,8,power_law_1.2,0.021587200462818146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,4,8,power_law_1.01,0.022412799298763275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,4,8,power_law_1.2,0.021580800414085388
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,4,8,power_law_1.01,0.022623999416828154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,4,8,power_law_1.2,0.021382400393486024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,4,8,power_law_1.01,0.023852799832820893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,4,8,power_law_1.01,0.04294399917125702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,4,8,power_law_1.2,0.02261119931936264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,4,8,power_law_1.01,0.02712959945201874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,4,8,power_law_1.01,0.04457600116729736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,4,8,power_law_1.2,0.02874239981174469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,4,8,power_law_1.01,0.02752000093460083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,4,8,power_law_1.01,0.04108160138130188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,4,8,power_law_1.2,0.02791680097579956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,4,8,power_law_1.01,0.033267199993133545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,4,8,power_law_1.01,0.04170880019664765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,4,8,power_law_1.2,0.031200000643730165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,4,8,power_law_1.01,0.028352001309394838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,4,8,power_law_1.01,0.04170880019664765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,4,8,power_law_1.2,0.029164800047874452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,4,8,power_law_1.01,0.02958720028400421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,4,8,power_law_1.01,0.04232319891452789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,4,8,power_law_1.2,0.02999039888381958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,4,8,power_law_1.01,0.033062401413917544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,4,8,power_law_1.01,0.042534399032592776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,4,8,power_law_1.2,0.03243519961833954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,4,8,power_law_1.01,0.03777279853820801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,4,8,power_law_1.01,0.04314239919185638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,4,8,power_law_1.2,0.04247680008411407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,4,8,power_law_1.01,0.045535999536514285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,4,8,power_law_1.01,0.043558400869369504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,4,8,power_law_1.2,0.04268800020217896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,4,8,power_law_1.01,0.04597119987010956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,4,8,power_law_1.01,0.046003198623657225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,4,8,power_law_1.2,0.049235200881958006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,4,8,power_law_1.01,0.06071680188179016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,4,8,power_law_1.01,0.045798400044441225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,4,8,power_law_1.2,0.05619199872016907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,4,8,power_law_1.01,0.06154879927635193
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,4,8,power_law_1.01,0.0470335990190506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,4,8,power_law_1.2,0.05945600271224975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,4,8,power_law_1.01,0.07340800166130065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,4,8,power_law_1.2,0.07216640114784241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,4,8,power_law_1.01,0.049081599712371825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,4,8,power_law_1.01,0.09224320054054261
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,4,8,power_law_1.01,0.05318400263786316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,4,8,power_law_1.2,0.09162880182266235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,4,8,power_law_1.01,0.11539839506149292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,4,8,power_law_1.01,0.0617792010307312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,4,8,power_law_1.2,0.11148799657821655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,4,8,power_law_1.01,0.1573632001876831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,4,8,power_law_1.01,0.06763520240783691
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,4,8,power_law_1.2,0.16350079774856568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,4,8,power_law_1.01,0.21799681186676026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,4,8,power_law_1.01,0.06567680239677429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,4,8,power_law_1.2,0.21389439105987548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,4,8,power_law_1.01,0.3044095993041992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,4,8,power_law_1.01,0.08184959888458251
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,4,8,power_law_1.01,0.4111167907714844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,4,8,power_law_1.2,0.30972800254821775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,4,8,power_law_1.01,0.0908415973186493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,4,8,power_law_1.01,0.5788479804992676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,4,8,power_law_1.2,0.40517759323120117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,4,8,power_law_1.01,0.11585279703140258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,4,8,power_law_1.01,0.774841594696045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,4,8,power_law_1.2,0.6013631820678711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,4,8,power_law_1.01,0.14635519981384276
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,4,8,power_law_1.01,1.1854592323303224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,4,8,power_law_1.2,0.7859072208404541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,4,8,power_law_1.01,0.1924415946006775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,4,8,power_law_1.01,1.492454433441162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,4,8,power_law_1.2,1.2374719619750976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,4,8,power_law_1.01,0.22581119537353517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,4,8,power_law_1.01,1.9088064193725587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,4,8,power_law_1.2,1.5944512367248536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,4,8,power_law_1.01,0.32554240226745607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,4,8,power_law_1.01,3.139481544494629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,4,8,power_law_1.2,1.9546815872192382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,4,8,power_law_1.01,0.3763520002365112
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,4,8,power_law_1.2,2.903321647644043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,4,8,power_law_1.01,6.180947113037109
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,4,8,power_law_1.01,0.5580095767974853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,4,8,power_law_1.01,0.7941440105438232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,4,8,power_law_1.2,6.166604614257812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,4,8,power_law_1.01,0.9727168083190918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,4,8,power_law_1.01,1.5707200050354004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,4,8,power_law_1.2,0.04351359903812409
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,4,8,power_law_1.2,0.0463808000087738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,4,8,power_law_1.01,3.193574333190918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,4,8,power_law_1.2,0.0430976003408432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,4,8,power_law_1.2,0.04390400052070618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,8,4,power_law_1.01,0.020972800254821778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,4,8,power_law_1.2,0.043084800243377686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,8,4,power_law_1.01,0.020550400018692017
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,4,8,power_law_1.2,0.04391680061817169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,8,4,power_law_1.01,0.020960000157356263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,4,8,power_law_1.2,0.04474239945411682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,8,4,power_law_1.2,0.019359999895095827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,8,4,power_law_1.01,0.020563200116157532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,4,8,power_law_1.2,0.04492799937725067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,8,4,power_law_1.2,0.019167999923229217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,8,4,power_law_1.01,0.021376000344753267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,4,8,power_law_1.2,0.045151999592781066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,8,4,power_law_1.2,0.019993600249290467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,8,4,power_law_1.01,0.026707199215888978
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,4,8,power_law_1.2,0.044947201013565065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,8,4,power_law_1.2,0.019577600061893463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,8,4,power_law_1.01,0.02547839879989624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,4,8,power_law_1.2,0.047193598747253415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,8,4,power_law_1.2,0.020403200387954713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,8,4,power_law_1.01,0.028748801350593566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,4,8,power_law_1.2,0.05211520195007324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,8,4,power_law_1.2,0.023270399868488313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,8,4,power_law_1.01,0.0271232008934021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,4,8,power_law_1.2,0.052108800411224364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,8,4,power_law_1.2,0.022655999660491942
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,8,4,power_law_1.01,0.02876160144805908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,4,8,power_law_1.2,0.055180799961090085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,8,4,power_law_1.2,0.024300800263881685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,8,4,power_law_1.01,0.03530240058898926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,4,8,power_law_1.2,0.0676800012588501
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,8,4,power_law_1.2,0.025119999051094057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,8,4,power_law_1.01,0.03633280098438263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,4,8,power_law_1.2,0.06706560254096985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,8,4,power_law_1.2,0.025312000513076784
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,8,4,power_law_1.01,0.038790398836135866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,4,8,power_law_1.2,0.07136639952659607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,8,4,power_law_1.2,0.026956799626350402
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,8,4,power_law_1.01,0.04472959935665131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,4,8,power_law_1.2,0.08835840225219727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,8,4,power_law_1.2,0.03187839984893799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,4,8,power_law_1.2,0.09901440143585205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,8,4,power_law_1.01,0.04758400022983551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,8,4,power_law_1.2,0.032287999987602234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,4,8,power_law_1.2,0.11785600185394288
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,8,4,power_law_1.01,0.051692801713943484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,4,8,power_law_1.2,0.13895039558410643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,8,4,power_law_1.2,0.03331199884414673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,8,4,power_law_1.01,0.06336640119552613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,4,8,power_law_1.2,0.18686720132827758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,8,4,power_law_1.2,0.045407998561859134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,8,4,power_law_1.01,0.07934079766273498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,4,8,power_law_1.2,0.23909120559692382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,8,4,power_law_1.01,0.09080320000648498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,8,4,power_law_1.2,0.04723199903964996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,4,8,power_law_1.2,0.3412928104400635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,8,4,power_law_1.01,0.11230720281600952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,8,4,power_law_1.2,0.050310397148132326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,4,8,power_law_1.2,0.39495038986206055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,8,4,power_law_1.2,0.06465280055999756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,8,4,power_law_1.2,0.0810368001461029
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,4,8,power_law_1.2,0.6112063884735107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,8,4,power_law_1.2,0.11134079694747925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,4,8,power_law_1.2,0.8251968383789062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,8,4,power_law_1.2,0.1322368025779724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,4,8,power_law_1.2,0.9419648170471191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,8,4,power_law_1.2,0.19285759925842286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,4,8,power_law_1.2,1.646067237854004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,8,4,power_law_1.2,0.2444607973098755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,4,8,power_law_1.2,3.3418048858642577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,8,4,power_law_1.2,0.356825590133667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,8,4,power_law_1.2,0.4686592102050781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,8,4,power_law_1.2,0.6946112155914307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,8,4,power_law_1.2,0.9207039833068847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,8,4,power_law_1.01,0.05375360250473023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,8,4,power_law_1.2,1.1453696250915528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,8,4,power_law_1.01,0.04105600118637085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,8,4,power_law_1.01,0.041875201463699344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,8,4,power_law_1.2,1.8185407638549804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,8,4,power_law_1.01,0.04310399889945984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,8,4,power_law_1.2,3.5939456939697267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,8,4,power_law_1.01,0.04310399889945984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,8,4,power_law_1.01,0.04268800020217896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,8,4,power_law_1.01,0.04302720129489899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,8,4,power_law_1.01,0.04310399889945984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,8,4,power_law_1.2,0.047443199157714847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,8,4,power_law_1.01,0.044121599197387694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,8,4,power_law_1.2,0.04273279905319214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,8,4,power_law_1.01,0.044736000895500186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,8,4,power_law_1.2,0.041715198755264284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,8,4,power_law_1.01,0.044736000895500186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,8,4,power_law_1.01,0.04965760111808777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,8,4,power_law_1.2,0.040479999780654904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,8,4,power_law_1.01,0.05047680139541626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,8,4,power_law_1.2,0.041715198755264284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,8,4,power_law_1.01,0.05129600167274475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,8,4,power_law_1.2,0.04252159893512726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,8,4,power_law_1.01,0.06317440271377564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,8,4,power_law_1.2,0.04232960045337677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,8,4,power_law_1.01,0.06603519916534424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,8,4,power_law_1.2,0.04293760061264038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,8,4,power_law_1.01,0.06829439997673034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,8,4,power_law_1.2,0.04293760061264038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,8,4,power_law_1.01,0.08221439719200134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,8,4,power_law_1.2,0.043961599469184875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,8,4,power_law_1.01,0.091839998960495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,8,4,power_law_1.2,0.04539520144462585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,8,4,power_law_1.01,0.12092800140380859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,8,4,power_law_1.2,0.04948480129241943
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,8,4,power_law_1.01,0.12153600454330445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,8,4,power_law_1.2,0.049491199851036075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,8,4,power_law_1.01,0.1692479968070984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,8,4,power_law_1.2,0.054201602935791016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,8,4,power_law_1.01,0.19792640209197998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,8,4,power_law_1.2,0.05952640175819397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,8,4,power_law_1.01,0.27370240688323977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,8,4,power_law_1.2,0.06484479904174804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,8,4,power_law_1.01,0.3720128059387207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,8,4,power_law_1.2,0.06750720143318176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,8,4,power_law_1.01,0.5567423820495605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,8,4,power_law_1.2,0.0830784022808075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,8,4,power_law_1.01,0.7621503829956054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,8,4,power_law_1.2,0.0933184027671814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,8,4,power_law_1.2,0.11215360164642334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,8,4,power_law_1.01,0.7490303993225098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,8,4,power_law_1.2,0.14533120393753052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,8,4,power_law_1.01,1.307539176940918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,8,4,power_law_1.2,0.16110719442367555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,8,4,power_law_1.01,3.1253311157226564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,8,4,power_law_1.2,0.21290879249572753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,8,4,power_law_1.2,0.30337278842926024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,8,4,power_law_1.2,0.3814016103744507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,8,4,power_law_1.2,0.6949503898620606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,8,4,power_law_1.2,0.7437119960784913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,16,2,power_law_1.01,0.01996160000562668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,16,2,power_law_1.01,0.019763199985027312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,8,4,power_law_1.2,1.0124671936035157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,16,2,power_law_1.01,0.019756799936294554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,8,4,power_law_1.2,1.4718208312988281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,16,2,power_law_1.01,0.019340799748897554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,8,4,power_law_1.2,3.0971200942993162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,16,2,power_law_1.01,0.020985600352287293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,16,2,power_law_1.01,0.022412799298763275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,16,2,power_law_1.01,0.02343679964542389
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,16,2,power_law_1.01,0.0230335995554924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,16,2,power_law_1.01,0.024672000110149382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,16,2,power_law_1.01,0.02508159875869751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,16,2,power_law_1.2,0.0193792000412941
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,16,2,power_law_1.01,0.08141440153121948
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,16,2,power_law_1.01,0.025088000297546386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,16,2,power_law_1.2,0.018764799833297728
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,16,2,power_law_1.01,0.1115455985069275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,16,2,power_law_1.01,0.031020799279212953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,16,2,power_law_1.2,0.01998720020055771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,16,2,power_law_1.01,0.12896000146865844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,16,2,power_law_1.01,0.030406400561332703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,16,2,power_law_1.2,0.021631999313831328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,16,2,power_law_1.01,0.20616960525512695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,16,2,power_law_1.01,0.031225600838661195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,16,2,power_law_1.2,0.02245119959115982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,16,2,power_law_1.01,0.0328575998544693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,16,2,power_law_1.01,0.2532416105270386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,16,2,power_law_1.2,0.022860799729824067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,16,2,power_law_1.01,0.03325439989566803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,16,2,power_law_1.01,0.3274048089981079
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,16,2,power_law_1.2,0.02531839907169342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,16,2,power_law_1.01,0.035519999265670774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,16,2,power_law_1.01,0.4263040065765381
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,16,2,power_law_1.2,0.02449920028448105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,16,2,power_law_1.01,0.050470399856567386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,16,2,power_law_1.01,0.6337984085083008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,16,2,power_law_1.2,0.027372801303863527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,16,2,power_law_1.01,0.05539199709892273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,16,2,power_law_1.2,0.02757120132446289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,16,2,power_law_1.01,0.9133312225341796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,16,2,power_law_1.01,0.07464320063591004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,16,2,power_law_1.2,0.02675839960575104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,16,2,power_law_1.01,1.9076480865478516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,16,2,power_law_1.01,0.09305599927902222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,16,2,power_law_1.2,0.0322816014289856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,16,2,power_law_1.01,0.12951040267944336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,16,2,power_law_1.2,0.03269760012626648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,16,2,power_law_1.01,0.15512319803237914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,16,2,power_law_1.2,0.03433600068092346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,16,2,power_law_1.01,0.22783360481262208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,16,2,power_law_1.2,0.03925119936466217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,16,2,power_law_1.01,0.04048640131950378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,16,2,power_law_1.01,0.28682239055633546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,16,2,power_law_1.2,0.03800959885120392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,16,2,power_law_1.01,0.042124798893928526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,16,2,power_law_1.01,0.41539840698242186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,16,2,power_law_1.2,0.05050240159034729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,16,2,power_law_1.01,0.04167680144309997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,16,2,power_law_1.2,0.059935998916625974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,16,2,power_law_1.01,0.5419839859008789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,16,2,power_law_1.01,0.044352000951766966
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,16,2,power_law_1.2,0.07570559978485107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,16,2,power_law_1.01,0.6732736110687256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,16,2,power_law_1.01,0.044582399725914004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,16,2,power_law_1.2,0.09373440146446228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,16,2,power_law_1.01,1.0634048461914063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,16,2,power_law_1.01,0.04457600116729736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,16,2,power_law_1.2,0.11235840320587158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,16,2,power_law_1.01,2.104198455810547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,16,2,power_law_1.01,0.04498560130596161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,16,2,power_law_1.2,0.16212480068206786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,16,2,power_law_1.01,0.045407998561859134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,16,2,power_law_1.2,0.20902400016784667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,16,2,power_law_1.01,0.046009600162506104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,16,2,power_law_1.2,0.2684096097946167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,16,2,power_law_1.01,0.04622080028057098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,16,2,power_law_1.2,0.40952320098876954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,16,2,power_law_1.2,0.04105600118637085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,16,2,power_law_1.01,0.047244799137115476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,16,2,power_law_1.2,0.6108416080474853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,16,2,power_law_1.2,0.04264959990978241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,16,2,power_law_1.01,0.04805760085582733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,16,2,power_law_1.2,0.728601598739624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,16,2,power_law_1.2,0.043699198961257936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,16,2,power_law_1.01,0.0486847996711731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,16,2,power_law_1.2,0.04597119987010956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,16,2,power_law_1.2,1.0781951904296876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,16,2,power_law_1.01,0.052774399518966675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,16,2,power_law_1.2,0.04576640129089356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,16,2,power_law_1.01,0.06034560203552246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,16,2,power_law_1.2,1.4513471603393555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,16,2,power_law_1.2,0.04596480131149292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,16,2,power_law_1.01,0.06649600267410279
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,16,2,power_law_1.2,3.1649023056030274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,16,2,power_law_1.2,0.04658559858798981
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,16,2,power_law_1.01,0.06936320066452026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,16,2,power_law_1.2,0.04616959989070892
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,16,2,power_law_1.01,0.0818560004234314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,16,2,power_law_1.2,0.0463808000087738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,16,2,power_law_1.01,0.08432000279426574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,16,2,power_law_1.2,0.04657920002937317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,32,1,power_law_1.01,0.018771199882030486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,16,2,power_law_1.01,0.11093759536743164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,16,2,power_law_1.2,0.04822399914264679
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,32,1,power_law_1.01,0.018969599902629853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,16,2,power_law_1.01,0.13470079898834228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,16,2,power_law_1.2,0.05128960013389587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,32,1,power_law_1.01,0.019596800208091736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,16,2,power_law_1.01,0.15312639474868775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,16,2,power_law_1.2,0.05048959851264954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,32,1,power_law_1.01,0.020819200575351714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,16,2,power_law_1.01,0.18486399650573732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,16,2,power_law_1.2,0.05415679812431336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,32,1,power_law_1.01,0.02122880071401596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,16,2,power_law_1.01,0.281113600730896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,16,2,power_law_1.2,0.06296319961547851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,32,1,power_law_1.01,0.022463999688625336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,16,2,power_law_1.01,0.3714303970336914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,16,2,power_law_1.2,0.06624000072479248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,32,1,power_law_1.01,0.022860799729824067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,16,2,power_law_1.2,0.06683520078659058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,16,2,power_law_1.01,0.519923210144043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,32,1,power_law_1.01,0.023660799860954283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,16,2,power_law_1.2,0.07751039862632751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,16,2,power_law_1.01,0.6393152236938476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,32,1,power_law_1.01,0.025113600492477416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,16,2,power_law_1.2,0.08651520013809204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,16,2,power_law_1.01,0.7863552093505859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,32,1,power_law_1.01,0.02573440074920654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,16,2,power_law_1.2,0.10556800365447998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,16,2,power_law_1.01,1.3243712425231933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,32,1,power_law_1.01,0.026547199487686156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,16,2,power_law_1.2,0.1340288043022156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,32,1,power_law_1.01,0.031673601269721983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,16,2,power_law_1.01,2.5914751052856446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,16,2,power_law_1.2,0.1774335980415344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,32,1,power_law_1.01,0.03248000144958496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,16,2,power_law_1.2,0.22228479385375977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,32,1,power_law_1.01,0.03372800052165985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,16,2,power_law_1.2,0.2736959934234619
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,32,1,power_law_1.01,0.034534400701522826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,16,2,power_law_1.2,0.370579195022583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,32,1,power_law_1.01,0.03638400137424469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,32,1,power_law_1.2,0.018566399812698364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,16,2,power_law_1.2,0.5391232013702393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,32,1,power_law_1.01,0.04990079998970032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,32,1,power_law_1.2,0.01918720006942749
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,16,2,power_law_1.2,0.6687359809875488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,32,1,power_law_1.01,0.05727999806404114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,32,1,power_law_1.2,0.018969599902629853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,16,2,power_law_1.2,0.8014719963073731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,32,1,power_law_1.01,0.06096640229225159
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,32,1,power_law_1.2,0.019180800020694732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,32,1,power_law_1.01,0.08184959888458251
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,16,2,power_law_1.2,1.2505855560302734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,32,1,power_law_1.2,0.019808000326156615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,32,1,power_law_1.01,0.09986559748649597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,32,1,power_law_1.2,0.021644799411296843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,16,2,power_law_1.2,2.7808704376220703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,32,1,power_law_1.01,0.1373568058013916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,32,1,power_law_1.2,0.02205439954996109
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,32,1,power_law_1.01,0.16643199920654297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,32,1,power_law_1.2,0.022668799757957457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,32,1,power_law_1.01,0.24364159107208253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,32,1,power_law_1.2,0.023686400055885314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,32,1,power_law_1.2,0.02409600019454956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,32,1,power_law_1.01,0.3091840028762817
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,32,1,power_law_1.01,0.04226559996604919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,32,1,power_law_1.2,0.025119999051094057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,32,1,power_law_1.01,0.44945921897888186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,32,1,power_law_1.01,0.042080000042915344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,32,1,power_law_1.2,0.029836800694465638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,32,1,power_law_1.01,0.5932223796844482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,32,1,power_law_1.01,0.04474239945411682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,32,1,power_law_1.2,0.030035200715065002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,32,1,power_law_1.01,0.7265535831451416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,32,1,power_law_1.01,0.04801279902458191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,32,1,power_law_1.2,0.03229439854621887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,32,1,power_law_1.01,1.152735996246338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,32,1,power_law_1.01,0.048825600743293764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,32,1,power_law_1.2,0.033107200264930726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,32,1,power_law_1.01,2.2635776519775392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,32,1,power_law_1.01,0.04965760111808777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,32,1,power_law_1.2,0.03433600068092346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,32,1,power_law_1.01,0.049235200881958006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,32,1,power_law_1.2,0.0367935985326767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,32,1,power_law_1.01,0.049856001138687135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,32,1,power_law_1.2,0.05358719825744629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,32,1,power_law_1.01,0.05047680139541626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,32,1,power_law_1.2,0.05973119735717773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,32,1,power_law_1.01,0.05047680139541626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,32,1,power_law_1.2,0.040678399801254275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,32,1,power_law_1.2,0.08246399760246277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,32,1,power_law_1.01,0.050886398553848265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,32,1,power_law_1.2,0.040889599919319154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,32,1,power_law_1.2,0.09823359847068787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,32,1,power_law_1.01,0.05456640124320984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,32,1,power_law_1.2,0.04170880019664765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,32,1,power_law_1.2,0.13714560270309448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,32,1,power_law_1.01,0.05619840025901794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,32,1,power_law_1.2,0.04785920083522797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,32,1,power_law_1.2,0.16601599454879762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,32,1,power_law_1.01,0.05743359923362732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,32,1,power_law_1.2,0.047443199157714847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,32,1,power_law_1.2,0.24263041019439696
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,32,1,power_law_1.01,0.06522240042686463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,32,1,power_law_1.2,0.04805760085582733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,32,1,power_law_1.2,0.3087680101394653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,32,1,power_law_1.01,0.06664320230484008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,32,1,power_law_1.2,0.05072000026702881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,32,1,power_law_1.2,0.45151357650756835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,32,1,power_law_1.01,0.07176960110664368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,32,1,power_law_1.2,0.048256000876426695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,32,1,power_law_1.2,0.585862398147583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,32,1,power_law_1.01,0.08488320112228394
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,32,1,power_law_1.2,0.04929920136928558
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,8,4,power_law_1.01,0.1463104009628296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,32,1,power_law_1.01,0.09654399752616882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,32,1,power_law_1.2,0.7265664100646972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,32,1,power_law_1.2,0.049491199851036075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,8,4,power_law_1.01,0.21881599426269532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,32,1,power_law_1.01,0.11489919424057007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,32,1,power_law_1.2,1.1478400230407715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,32,1,power_law_1.2,0.04928640127182007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,8,4,power_law_1.01,0.27409920692443845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,32,1,power_law_1.01,0.13483519554138185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,32,1,power_law_1.2,2.2680896759033202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,32,1,power_law_1.2,0.05297279953956604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,8,4,power_law_1.01,0.4489920139312744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,32,1,power_law_1.01,0.17437440156936646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,32,1,power_law_1.2,0.055615997314453124
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,8,4,power_law_1.01,0.6949567794799805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,32,1,power_law_1.01,0.2081536054611206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,32,1,power_law_1.2,0.05600000023841858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,8,4,power_law_1.01,0.8424127578735352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,32,1,power_law_1.01,0.2888511896133423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,32,1,power_law_1.2,0.06402559876441956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,32,1,power_law_1.01,0.3654592037200928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,8,4,power_law_1.01,1.137945556640625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,32,1,power_law_1.2,0.06955519914627076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,32,1,power_law_1.01,0.5235455989837646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,8,4,power_law_1.01,1.4029696464538575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,32,1,power_law_1.2,0.07363839745521546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,32,1,power_law_1.01,0.6736639976501465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,32,1,power_law_1.2,0.08429440259933471
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,8,4,power_law_1.01,2.2495872497558596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,32,1,power_law_1.01,0.832153606414795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,32,1,power_law_1.2,0.09598720073699951
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,8,4,power_law_1.01,5.0613056182861325
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,32,1,power_law_1.01,1.3054783821105957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,32,1,power_law_1.2,0.11216000318527222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,32,1,power_law_1.2,0.13345279693603515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,32,1,power_law_1.01,2.646297645568848
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,32,1,power_law_1.2,0.17256959676742553
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,32,1,power_law_1.2,0.20472319126129152
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,1,32,power_law_1.01,0.051744002103805545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,32,1,power_law_1.2,0.2847935914993286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,1,32,power_law_1.01,0.05278080105781555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,32,1,power_law_1.2,0.36160640716552733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,1,32,power_law_1.01,0.09815040230751038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,1,32,power_law_1.01,0.03925119936466217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,32,1,power_law_1.2,0.5178624153137207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,1,32,power_law_1.01,0.09347839951515198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,32,1,power_law_1.2,0.6728960037231445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,1,32,power_law_1.01,0.03925119936466217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,1,32,power_law_1.01,0.07708160281181335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,32,1,power_law_1.2,0.8223999977111817
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,1,32,power_law_1.01,0.0486847996711731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,32,1,power_law_1.2,1.3071616172790528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,1,32,power_law_1.01,0.07259520292282104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,1,32,power_law_1.01,0.05604479908943176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,32,1,power_law_1.2,2.6246463775634767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,1,32,power_law_1.01,0.07708160281181335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,1,32,power_law_1.01,0.06176000237464905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,1,32,power_law_1.2,0.05189759731292724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,1,32,power_law_1.01,0.08813440203666686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,1,32,power_law_1.01,0.06464639902114869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,1,32,power_law_1.2,0.05229439735412598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,1,32,power_law_1.01,0.0893887996673584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,1,32,power_law_1.01,0.07408639788627625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,1,32,power_law_1.2,0.03591679930686951
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,1,32,power_law_1.01,0.0902079999446869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,1,32,power_law_1.2,0.04431999921798706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,1,32,power_law_1.01,0.084307199716568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,1,32,power_law_1.2,0.09781759977340698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,1,32,power_law_1.01,0.09428480267524719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,1,32,power_law_1.01,0.10028799772262573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,1,32,power_law_1.2,0.04593920111656189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,1,32,power_law_1.2,0.0945472002029419
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,1,32,power_law_1.01,0.09553279876708984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,1,32,power_law_1.01,0.1162559986114502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,1,32,power_law_1.2,0.05373439788818359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,1,32,power_law_1.2,0.06504319906234741
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,1,32,power_law_1.01,0.09594240188598632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,1,32,power_law_1.2,0.054764801263809205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,1,32,power_law_1.01,0.13101439476013182
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,1,32,power_law_1.2,0.06915839910507202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,1,32,power_law_1.01,0.09819520115852357
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,1,32,power_law_1.01,0.16111359596252442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,1,32,power_law_1.2,0.0603007972240448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,1,32,power_law_1.2,0.07119359970092773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,1,32,power_law_1.01,0.09880319833755494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,1,32,power_law_1.01,0.11994240283966065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,1,32,power_law_1.2,0.06766719818115234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,1,32,power_law_1.2,0.0818560004234314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,1,32,power_law_1.01,0.09778559803962708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,1,32,power_law_1.2,0.07217280268669128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,1,32,power_law_1.01,0.1404031991958618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,1,32,power_law_1.2,0.08963199853897094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,1,32,power_law_1.01,0.10618239641189575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,1,32,power_law_1.01,0.17482880353927613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,1,32,power_law_1.2,0.0850816011428833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,1,32,power_law_1.2,0.09249920248985291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,1,32,power_law_1.01,0.1098688006401062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,1,32,power_law_1.01,0.15189119577407836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,1,32,power_law_1.2,0.10104960203170776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,1,32,power_law_1.2,0.09207680225372314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,1,32,power_law_1.01,0.11639039516448975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,1,32,power_law_1.2,0.11844480037689209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,1,32,power_law_1.01,0.19120639562606812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,1,32,power_law_1.2,0.09618560075759888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,1,32,power_law_1.01,0.12912000417709352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,1,32,power_law_1.01,0.25408639907836916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,1,32,power_law_1.2,0.1471295952796936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,1,32,power_law_1.2,0.09349759817123413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,1,32,power_law_1.01,0.14920320510864257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,1,32,power_law_1.01,0.307532811164856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,1,32,power_law_1.2,0.09699199795722961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,1,32,power_law_1.01,0.17171839475631714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,1,32,power_law_1.01,0.1790719985961914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,1,32,power_law_1.2,0.0986303985118866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,1,32,power_law_1.01,0.4724031925201416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,1,32,power_law_1.01,0.22558081150054932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,1,32,power_law_1.2,0.10008959770202637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,1,32,power_law_1.01,0.6288447856903077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,1,32,power_law_1.2,0.10726399421691894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,1,32,power_law_1.01,0.2704063892364502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,1,32,power_law_1.01,0.9768383979797364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,1,32,power_law_1.2,0.10684159994125367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,1,32,power_law_1.01,0.34332799911499023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,1,32,power_law_1.01,1.1912511825561523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,1,32,power_law_1.2,0.11994240283966065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,1,32,power_law_1.01,0.4318079948425293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,1,32,power_law_1.01,1.930988883972168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,1,32,power_law_1.2,0.13509759902954102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,1,32,power_law_1.01,0.6153024196624756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,1,32,power_law_1.01,2.5894079208374023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,1,32,power_law_1.2,0.14801280498504638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,1,32,power_law_1.01,0.82357759475708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,1,32,power_law_1.01,2.893951988220215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,1,32,power_law_1.2,0.17400959730148316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,1,32,power_law_1.01,0.9419520378112793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,1,32,power_law_1.01,4.967974472045898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,1,32,power_law_1.2,0.1842560052871704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,1,32,power_law_1.01,1.420576000213623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,1,32,power_law_1.2,0.22909440994262695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,1,32,power_law_1.01,10.164153289794921
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,1,32,power_law_1.2,0.2812608003616333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,1,32,power_law_1.01,2.798054313659668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,1,32,power_law_1.2,0.410752010345459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,1,32,power_law_1.2,0.48633599281311035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,1,32,power_law_1.2,0.6617792129516602
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,1,32,power_law_1.2,0.9210432052612305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,1,32,power_law_1.2,1.2096128463745117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,2,16,power_law_1.2,0.02446720004081726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,2,16,power_law_1.2,0.025900799036026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,2,16,power_law_1.01,0.0310591995716095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,1,32,power_law_1.2,1.881216049194336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,2,16,power_law_1.01,0.05604479908943176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,2,16,power_law_1.2,0.026719999313354493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,2,16,power_law_1.2,0.026918399333953857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,1,32,power_law_1.2,3.7856510162353514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,2,16,power_law_1.2,0.034092798829078674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,2,16,power_law_1.2,0.03982079923152924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,2,16,power_law_1.2,0.049446401000022885
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,2,16,power_law_1.01,0.08081920146942138
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,2,16,power_law_1.2,0.060096001625061034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,2,16,power_law_1.01,0.10929280519485474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,2,16,power_law_1.2,0.060915201902389526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,2,16,power_law_1.01,0.07160959839820862
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,2,16,power_law_1.2,0.0689087986946106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,2,16,power_law_1.01,0.06751360297203064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,2,16,power_law_1.2,0.0815999984741211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,2,16,power_law_1.2,0.09594240188598632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,2,16,power_law_1.01,0.07447680234909057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,2,16,power_law_1.2,0.11088639497756958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,2,16,power_law_1.01,0.08512639999389648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,2,16,power_law_1.2,0.14016000032424927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,2,16,power_law_1.01,0.0949504017829895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,2,16,power_law_1.2,0.1033087968826294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,2,16,power_law_1.01,0.0937279999256134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,2,16,power_law_1.2,0.11887359619140625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,2,16,power_law_1.01,0.10069119930267334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,2,16,power_law_1.2,0.15102720260620117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,2,16,power_law_1.01,0.10028159618377686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,2,16,power_law_1.2,0.12910720109939575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,2,16,power_law_1.01,0.10088959932327271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,2,16,power_law_1.2,0.16085120439529418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,2,16,power_law_1.01,0.10314240455627441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,2,16,power_law_1.2,0.22639999389648438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,2,16,power_law_1.01,0.10397440195083618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,2,16,power_law_1.2,0.2859904050827026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,2,16,power_law_1.01,0.1060096025466919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,2,16,power_law_1.2,0.41623678207397463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,2,16,power_law_1.01,0.11134079694747925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,2,16,power_law_1.01,0.11626240015029907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,2,16,power_law_1.2,0.5407487869262695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,2,16,power_law_1.01,0.12076799869537354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,2,16,power_law_1.2,0.8002431869506836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,2,16,power_law_1.01,0.14204800128936768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,2,16,power_law_1.2,1.061292839050293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,2,16,power_law_1.01,0.14737919569015503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,2,16,power_law_1.2,1.5846336364746094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,2,16,power_law_1.01,0.174835205078125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,2,16,power_law_1.2,2.1099456787109374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,2,16,power_law_1.01,0.19141759872436523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,2,16,power_law_1.2,2.6331903457641603
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,2,16,power_law_1.01,0.23934080600738525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,2,16,power_law_1.2,4.202982330322266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,2,16,power_law_1.01,0.28215680122375486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,2,16,power_law_1.01,0.38331520557403564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,2,16,power_law_1.2,8.318854522705077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,2,16,power_law_1.01,0.4379263877868652
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,2,16,power_law_1.01,0.6329599857330322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,2,16,power_law_1.01,0.772435188293457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,2,16,power_law_1.2,0.08222079873085023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,2,16,power_law_1.01,0.9424127578735352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,2,16,power_law_1.2,0.1086400032043457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,2,16,power_law_1.01,1.4595392227172852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,2,16,power_law_1.2,0.06727039813995361
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,2,16,power_law_1.2,0.06890239715576171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,2,16,power_law_1.01,2.9349056243896485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,2,16,power_law_1.2,0.07668480277061462
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,2,16,power_law_1.2,0.08119680285453797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,2,16,power_law_1.2,0.09512320160865784
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,2,16,power_law_1.2,0.09799039959907532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,4,8,power_law_1.01,0.02122880071401596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,2,16,power_law_1.2,0.10126080513000488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,4,8,power_law_1.01,0.021644799411296843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,2,16,power_law_1.2,0.10023679733276367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,4,8,power_law_1.01,0.023481599986553192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,2,16,power_law_1.2,0.10451840162277222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,4,8,power_law_1.01,0.0236735999584198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,2,16,power_law_1.2,0.10700160264968872
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,4,8,power_law_1.01,0.025727999210357667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,2,16,power_law_1.2,0.10618239641189575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,4,8,power_law_1.01,0.03639039993286133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,2,16,power_law_1.2,0.10782079696655274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,4,8,power_law_1.01,0.040275201201438904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,2,16,power_law_1.2,0.11477760076522828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,4,8,power_law_1.01,0.04805119931697845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,2,16,power_law_1.2,0.12133760452270508
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,4,8,power_law_1.01,0.052160000801086424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,2,16,power_law_1.2,0.12215039730072022
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,4,8,power_law_1.01,0.060140800476074216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,2,16,power_law_1.2,0.1414080023765564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,4,8,power_law_1.01,0.07223680019378662
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,2,16,power_law_1.2,0.15697280168533326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,4,8,power_law_1.01,0.07530879974365234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,4,8,power_law_1.01,0.0847104012966156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,2,16,power_law_1.2,0.18544000387191772
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,4,8,power_law_1.01,0.10438400506973267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,2,16,power_law_1.2,0.20181760787963868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,2,16,power_law_1.2,0.24829440116882323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,4,8,power_law_1.01,0.082259202003479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,2,16,power_law_1.2,0.3150719881057739
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,4,8,power_law_1.01,0.09312000274658203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,4,8,power_law_1.01,0.11503360271453858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,2,16,power_law_1.2,0.38798720836639405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,4,8,power_law_1.01,0.10682879686355591
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,2,16,power_law_1.2,0.47318401336669924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,4,8,power_law_1.01,0.1326464056968689
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,2,16,power_law_1.2,0.6695871829986573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,4,8,power_law_1.01,0.17769600152969361
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,2,16,power_law_1.2,0.8689984321594239
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,4,8,power_law_1.01,0.22271358966827393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,2,16,power_law_1.2,1.1445183753967285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,4,8,power_law_1.01,0.31612799167633054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,2,16,power_law_1.2,1.8156415939331054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,4,8,power_law_1.01,0.4103360176086426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,4,8,power_law_1.01,0.6075776100158692
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,2,16,power_law_1.2,3.9510208129882813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,4,8,power_law_1.01,0.7936063766479492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,4,8,power_law_1.01,1.182579231262207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,4,8,power_law_1.01,1.574841594696045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,4,8,power_law_1.01,1.9625152587890624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,4,8,power_law_1.2,0.0230335995554924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,4,8,power_law_1.2,0.02343039959669113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,4,8,power_law_1.01,3.1167680740356447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,4,8,power_law_1.2,0.024665600061416625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,4,8,power_law_1.01,6.214982223510742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,4,8,power_law_1.2,0.025279998779296875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,4,8,power_law_1.2,0.028358399868011475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,4,8,power_law_1.2,0.03982079923152924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,4,8,power_law_1.2,0.04842880070209503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,4,8,power_law_1.01,0.06995199918746949
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,4,8,power_law_1.2,0.05334399938583374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,4,8,power_law_1.01,0.0896127998828888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,4,8,power_law_1.2,0.061945599317550656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,4,8,power_law_1.01,0.0646399974822998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,4,8,power_law_1.2,0.07176960110664368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,4,8,power_law_1.01,0.07446399927139283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,4,8,power_law_1.2,0.08488320112228394
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,4,8,power_law_1.01,0.07734400033950806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,4,8,power_law_1.2,0.08603519797325135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,4,8,power_law_1.2,0.09839360117912292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,4,8,power_law_1.01,0.08881279826164246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,4,8,power_law_1.2,0.1213312029838562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,4,8,power_law_1.01,0.10558719635009765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,4,8,power_law_1.2,0.0936959981918335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,4,8,power_law_1.01,0.10968960523605346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,4,8,power_law_1.2,0.11025919914245605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,4,8,power_law_1.01,0.11338239908218384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,4,8,power_law_1.2,0.13360639810562133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,4,8,power_law_1.01,0.11196160316467285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,4,8,power_law_1.2,0.12543359994888306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,4,8,power_law_1.01,0.11830400228500366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,1,32,power_law_1.2,0.10044159889221191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,4,8,power_law_1.2,0.1504320025444031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,4,8,power_law_1.01,0.11624319553375244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,1,32,power_law_1.2,0.11723519563674926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,4,8,power_law_1.2,0.21473278999328613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,4,8,power_law_1.01,0.12136960029602051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,1,32,power_law_1.2,0.15634560585021973
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,4,8,power_law_1.2,0.25138559341430666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,4,8,power_law_1.01,0.12281600236892701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,1,32,power_law_1.2,0.1323904037475586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,4,8,power_law_1.2,0.3769279956817627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,4,8,power_law_1.01,0.12896000146865844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,1,32,power_law_1.2,0.17047040462493895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,4,8,power_law_1.2,0.5055424213409424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,4,8,power_law_1.01,0.13304959535598754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,1,32,power_law_1.2,0.24605441093444824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,4,8,power_law_1.01,0.14165120124816893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,4,8,power_law_1.2,0.7539584159851074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,1,32,power_law_1.2,0.27492480278015136
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,4,8,power_law_1.01,0.15781760215759277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,4,8,power_law_1.2,1.0132287979125976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,1,32,power_law_1.2,0.41132798194885256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,4,8,power_law_1.01,0.17891839742660523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,4,8,power_law_1.2,1.443507194519043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,1,32,power_law_1.2,0.5661503791809082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,4,8,power_law_1.01,0.20453119277954102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,1,32,power_law_1.2,0.8567359924316407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,4,8,power_law_1.2,1.929702377319336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,4,8,power_law_1.01,0.22849280834198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,1,32,power_law_1.2,1.0736191749572754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,4,8,power_law_1.2,2.5398080825805662
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,4,8,power_law_1.01,0.2755840063095093
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,1,32,power_law_1.2,1.7496768951416015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,4,8,power_law_1.01,0.3190079927444458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,4,8,power_law_1.2,3.942073440551758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,1,32,power_law_1.2,2.4988479614257812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,4,8,power_law_1.01,0.41199359893798826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,4,8,power_law_1.2,7.584844970703125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,4,8,power_law_1.01,0.5055168151855469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,1,32,power_law_1.2,3.070783996582031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,4,8,power_law_1.01,0.6987008094787598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,1,32,power_law_1.2,5.179206466674804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,4,8,power_law_1.01,0.9551103591918946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,4,8,power_law_1.2,0.0840448021888733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,1,32,power_law_1.2,9.935539245605469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,4,8,power_law_1.01,1.1474111557006836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,4,8,power_law_1.2,0.08487679958343505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,2,16,power_law_1.01,0.03925760090351105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,4,8,power_law_1.01,1.6899328231811523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,4,8,power_law_1.2,0.06993280053138733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,2,16,power_law_1.01,0.0350847989320755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,4,8,power_law_1.2,0.0744383990764618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,2,16,power_law_1.01,0.049497601389884946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,8,4,power_law_1.01,0.022195200622081756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,4,8,power_law_1.01,3.3717247009277345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,4,8,power_law_1.2,0.0832319974899292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,2,16,power_law_1.01,0.04539520144462585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,8,4,power_law_1.01,0.023628799617290495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,4,8,power_law_1.2,0.08692479729652405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,2,16,power_law_1.01,0.05788800120353699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,8,4,power_law_1.01,0.02588160037994385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,4,8,power_law_1.2,0.10883840322494506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,2,16,power_law_1.01,0.06116480231285095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,8,4,power_law_1.2,0.02143999934196472
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,8,4,power_law_1.01,0.030399999022483824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,4,8,power_law_1.2,0.11477760076522828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,2,16,power_law_1.01,0.06321920156478882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,8,4,power_law_1.2,0.021836799383163453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,8,4,power_law_1.01,0.03550719916820526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,4,8,power_law_1.2,0.11293439865112305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,2,16,power_law_1.01,0.06792320013046264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,8,4,power_law_1.2,0.023686400055885314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,8,4,power_law_1.01,0.043910399079322815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,4,8,power_law_1.2,0.11519360542297363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,2,16,power_law_1.01,0.07734400033950806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,8,4,power_law_1.2,0.02675839960575104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,8,4,power_law_1.01,0.05292159914970398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,4,8,power_law_1.2,0.11662080287933349
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,2,16,power_law_1.01,0.08778240084648133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,8,4,power_law_1.2,0.028595200181007384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,8,4,power_law_1.01,0.055379199981689456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,4,8,power_law_1.2,0.11804800033569336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,2,16,power_law_1.01,0.09966719746589661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,8,4,power_law_1.2,0.03371520042419433
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,8,4,power_law_1.01,0.05988479852676391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,4,8,power_law_1.2,0.11969920396804809
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,2,16,power_law_1.01,0.11871999502182007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,8,4,power_law_1.2,0.04314880073070526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,8,4,power_law_1.01,0.063155198097229
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,4,8,power_law_1.2,0.12870399951934813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,2,16,power_law_1.01,0.09210879802703857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,8,4,power_law_1.2,0.047040000557899475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,8,4,power_law_1.01,0.0725823998451233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,4,8,power_law_1.2,0.13137279748916625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,2,16,power_law_1.01,0.1035647988319397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,8,4,power_law_1.2,0.051052802801132204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,8,4,power_law_1.01,0.07830399870872498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,4,8,power_law_1.2,0.13996800184249877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,2,16,power_law_1.01,0.12650879621505737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,8,4,power_law_1.2,0.059513598680496216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,8,4,power_law_1.01,0.08568959832191467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,4,8,power_law_1.2,0.14816639423370362
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,2,16,power_law_1.01,0.11276799440383911
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,8,4,power_law_1.2,0.070796799659729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,8,4,power_law_1.01,0.10085120201110839
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,4,8,power_law_1.2,0.1708799958229065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,8,4,power_law_1.2,0.07978879809379577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,2,16,power_law_1.01,0.13408639430999755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,8,4,power_law_1.01,0.08344320058822632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,4,8,power_law_1.2,0.1860479950904846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,8,4,power_law_1.2,0.09166719913482665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,2,16,power_law_1.01,0.17830400466918944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,8,4,power_law_1.01,0.0955136001110077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,4,8,power_law_1.2,0.2151360034942627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,8,4,power_law_1.2,0.11623680591583252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,2,16,power_law_1.01,0.22561280727386473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,8,4,power_law_1.01,0.10822399854660034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,4,8,power_law_1.2,0.23007359504699706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,8,4,power_law_1.2,0.0890175998210907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,2,16,power_law_1.01,0.3095936059951782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,8,4,power_law_1.01,0.10944639444351197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,4,8,power_law_1.2,0.2915263891220093
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,8,4,power_law_1.2,0.10149760246276855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,2,16,power_law_1.01,0.41239681243896487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,8,4,power_law_1.01,0.12645119428634644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,4,8,power_law_1.2,0.3283776044845581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,8,4,power_law_1.2,0.1285375952720642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,2,16,power_law_1.01,0.614137601852417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,8,4,power_law_1.01,0.1422144055366516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,4,8,power_law_1.2,0.445740795135498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,8,4,power_law_1.2,0.1240447998046875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,8,4,power_law_1.01,0.1671872019767761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,2,16,power_law_1.01,0.7736639976501465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,4,8,power_law_1.2,0.5948031902313232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,8,4,power_law_1.2,0.15475840568542482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,8,4,power_law_1.01,0.21758720874786378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,2,16,power_law_1.01,1.2068160057067872
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,8,4,power_law_1.2,0.16663680076599122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,4,8,power_law_1.2,0.8133440017700195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,8,4,power_law_1.01,0.27901439666748046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,2,16,power_law_1.01,1.5613247871398925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,8,4,power_law_1.2,0.20881280899047852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,8,4,power_law_1.01,0.3904320001602173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,4,8,power_law_1.2,1.0148672103881835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,2,16,power_law_1.01,1.8974271774291993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,8,4,power_law_1.2,0.297708797454834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,8,4,power_law_1.01,0.5170048236846924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,4,8,power_law_1.2,1.2219136238098145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,2,16,power_law_1.01,2.984063911437988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,8,4,power_law_1.2,0.3873984098434448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,8,4,power_law_1.01,0.740831995010376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,4,8,power_law_1.2,2.007097625732422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,8,4,power_law_1.2,0.5440639972686767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,2,16,power_law_1.01,5.740057754516601
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,8,4,power_law_1.01,0.926790428161621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,8,4,power_law_1.2,0.747436809539795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,4,8,power_law_1.2,4.3928382873535154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,8,4,power_law_1.01,1.1674431800842284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,8,4,power_law_1.2,1.0667263984680175
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,8,4,power_law_1.01,1.875014305114746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,8,4,power_law_1.2,1.462393569946289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,8,4,power_law_1.01,3.672140884399414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,8,4,power_law_1.2,1.8222335815429687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,8,4,power_law_1.01,0.08184959888458251
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,8,4,power_law_1.01,0.08615040183067321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,8,4,power_law_1.2,2.876422309875488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,8,4,power_law_1.01,0.070387202501297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,16,2,power_law_1.01,0.02136960029602051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,8,4,power_law_1.01,0.07775999903678894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,8,4,power_law_1.2,5.741279983520508
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,16,2,power_law_1.01,0.023628799617290495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,8,4,power_law_1.01,0.09168639779090881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,8,4,power_law_1.01,0.1095039963722229
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,16,2,power_law_1.01,0.024454399943351746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,16,2,power_law_1.2,0.021638399362564086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,8,4,power_law_1.01,0.13162239789962768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,16,2,power_law_1.01,0.03162240087985992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,16,2,power_law_1.2,0.022041599452495574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,8,4,power_law_1.01,0.1338688015937805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,16,2,power_law_1.01,0.041247999668121337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,16,2,power_law_1.2,0.0236735999584198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,8,4,power_law_1.01,0.13552000522613525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,16,2,power_law_1.01,0.04924159944057464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,8,4,power_law_1.01,0.13960959911346435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,16,2,power_law_1.2,0.026969599723815917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,16,2,power_law_1.01,0.06377599835395813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,8,4,power_law_1.01,0.1453503966331482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,16,2,power_law_1.2,0.03372159898281098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,16,2,power_law_1.01,0.06726400256156921
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,8,4,power_law_1.01,0.14718079566955566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,16,2,power_law_1.2,0.03842560052871704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,16,2,power_law_1.01,0.06930559873580933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,16,2,power_law_1.2,0.04191359877586365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,8,4,power_law_1.01,0.14739840030670165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,16,2,power_law_1.01,0.07379199862480164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,16,2,power_law_1.2,0.04579200148582459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,8,4,power_law_1.01,0.15434880256652833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,16,2,power_law_1.01,0.07872639894485474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,16,2,power_law_1.2,0.055027198791503903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,8,4,power_law_1.01,0.16316159963607788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,16,2,power_law_1.01,0.09059839844703674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,16,2,power_law_1.2,0.058303999900817874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,8,4,power_law_1.01,0.16828800439834596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,16,2,power_law_1.01,0.09607040286064147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,16,2,power_law_1.2,0.06506239771842956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,8,4,power_law_1.01,0.18016639947891236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,16,2,power_law_1.01,0.11149439811706544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,16,2,power_law_1.2,0.07529600262641907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,8,4,power_law_1.01,0.2055488109588623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,16,2,power_law_1.01,0.10064640045166015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,16,2,power_law_1.2,0.08390399813652039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,8,4,power_law_1.01,0.2264319896697998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,16,2,power_law_1.01,0.10698239803314209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,16,2,power_law_1.2,0.10273920297622681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,8,4,power_law_1.01,0.2643392086029053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,16,2,power_law_1.01,0.12460800409317016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,16,2,power_law_1.2,0.08512639999389648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,8,4,power_law_1.01,0.27683200836181643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,16,2,power_law_1.01,0.12621439695358277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,16,2,power_law_1.2,0.09434880018234253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,8,4,power_law_1.01,0.35015039443969725
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,16,2,power_law_1.01,0.14877439737319947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,16,2,power_law_1.2,0.1158336043357849
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,8,4,power_law_1.01,0.4019455909729004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,16,2,power_law_1.01,0.16225919723510743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,16,2,power_law_1.2,0.11441919803619385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,8,4,power_law_1.01,0.535481595993042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,16,2,power_law_1.01,0.19607679843902587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,16,2,power_law_1.2,0.13939839601516724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,16,2,power_law_1.01,0.25253119468688967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,8,4,power_law_1.01,0.6782336235046387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,16,2,power_law_1.2,0.15556479692459108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,16,2,power_law_1.01,0.3052351951599121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,8,4,power_law_1.01,0.932588768005371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,16,2,power_law_1.2,0.19203200340270996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,16,2,power_law_1.01,0.4223872184753418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,8,4,power_law_1.01,1.2293567657470703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,16,2,power_law_1.2,0.2604351997375488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,16,2,power_law_1.01,0.5304895877838135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,8,4,power_law_1.01,1.4521727561950684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,16,2,power_law_1.2,0.33703041076660156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,16,2,power_law_1.01,0.7879487991333007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,8,4,power_law_1.01,2.1353792190551757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,16,2,power_law_1.2,0.4793600082397461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,16,2,power_law_1.01,0.9980671882629395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,16,2,power_law_1.2,0.6276288032531738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,8,4,power_law_1.01,4.333913421630859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,16,2,power_law_1.01,1.237062358856201
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,16,2,power_law_1.2,0.9231743812561035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,16,2,power_law_1.2,1.2104384422302246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,16,2,power_law_1.2,1.4863552093505858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,16,2,power_law_1.2,2.296767997741699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,16,2,power_law_1.01,0.08021119832992554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,16,2,power_law_1.2,4.6236927032470705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,16,2,power_law_1.01,0.09168000221252441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,16,2,power_law_1.01,0.08696960210800171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,16,2,power_law_1.01,0.10110080242156982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,16,2,power_law_1.01,0.1211583971977234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,16,2,power_law_1.01,0.1455423951148987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,16,2,power_law_1.01,0.18384640216827391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,16,2,power_law_1.2,0.08103039860725403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,16,2,power_law_1.01,0.18508800268173217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,16,2,power_law_1.2,0.08984320163726807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,16,2,power_law_1.01,0.1908031940460205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,16,2,power_law_1.2,0.08389760255813598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,16,2,power_law_1.01,0.1994047999382019
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,16,2,power_law_1.2,0.09740800261497498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,16,2,power_law_1.01,0.21047039031982423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,16,2,power_law_1.2,0.11256959438323974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,16,2,power_law_1.01,0.2178431987762451
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,16,2,power_law_1.2,0.13058559894561766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,16,2,power_law_1.01,0.21907200813293456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,16,2,power_law_1.2,0.17482240200042726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,16,2,power_law_1.01,0.2239936113357544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,16,2,power_law_1.2,0.1852735996246338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,16,2,power_law_1.01,0.23382399082183838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,16,2,power_law_1.2,0.1903872013092041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,16,2,power_law_1.01,0.24343678951263428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,16,2,power_law_1.2,0.1942911982536316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,16,2,power_law_1.01,0.26064000129699705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,16,2,power_law_1.2,0.2075968027114868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,16,2,power_law_1.01,0.3005824089050293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,16,2,power_law_1.2,0.21210238933563233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,16,2,power_law_1.01,0.3247488021850586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,16,2,power_law_1.2,0.21434879302978516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,16,2,power_law_1.01,0.38290560245513916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,16,2,power_law_1.2,0.23832321166992188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,16,2,power_law_1.01,0.4339136123657227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,16,2,power_law_1.2,0.2469183921813965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,16,2,power_law_1.01,0.5313920021057129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,16,2,power_law_1.2,0.2561280012130737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,16,2,power_law_1.2,0.2735487937927246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,16,2,power_law_1.01,0.6141312122344971
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,16,2,power_law_1.2,0.30522239208221436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,16,2,power_law_1.01,0.8459712028503418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,16,2,power_law_1.2,0.3304768085479736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,16,2,power_law_1.01,1.0452223777770997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,16,2,power_law_1.2,0.39151360988616946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,16,2,power_law_1.01,1.4345600128173828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,16,2,power_law_1.2,0.43390722274780275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,16,2,power_law_1.01,1.8066688537597657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,16,2,power_law_1.2,0.5375232219696044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,16,2,power_law_1.01,2.2054271697998047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,16,2,power_law_1.2,0.6309247970581054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,16,2,power_law_1.01,3.445907211303711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,16,2,power_law_1.2,0.8547776222229004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,16,2,power_law_1.2,1.0382464408874512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,16,2,power_law_1.01,6.671501159667969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,16,2,power_law_1.2,1.4786879539489746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,16,2,power_law_1.2,1.8940544128417969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,16,2,power_law_1.2,2.182067108154297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,1,32,power_law_1.01,0.02102400064468384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,16,2,power_law_1.2,3.5564735412597654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,1,32,power_law_1.01,0.020428800582885744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,1,32,power_law_1.01,0.02040960043668747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,16,2,power_law_1.2,7.102175903320313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,1,32,power_law_1.01,0.020614400506019592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,1,32,power_law_1.01,0.023904000222682954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,1,32,power_law_1.01,0.02655999958515167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,1,32,power_law_1.01,0.031891199946403506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,1,32,power_law_1.01,0.03219200074672699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,1,32,power_law_1.2,0.020403200387954713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,1,32,power_law_1.01,0.03331199884414673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,1,32,power_law_1.2,0.01958400011062622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,1,32,power_law_1.01,0.03658879995346069
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,1,32,power_law_1.2,0.020211200416088104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,1,32,power_law_1.01,0.04314239919185638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,1,32,power_law_1.2,0.020396800339221956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,1,32,power_law_1.01,0.03720319867134094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,1,32,power_law_1.2,0.02409600019454956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,1,32,power_law_1.01,0.03638400137424469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,1,32,power_law_1.2,0.02778240144252777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,1,32,power_law_1.01,0.04540160000324249
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,1,32,power_law_1.2,0.03230080008506775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,1,32,power_law_1.01,0.03924480080604553
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,1,32,power_law_1.2,0.0310591995716095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,1,32,power_law_1.01,0.041459199786186215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,1,32,power_law_1.2,0.03391999900341034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,1,32,power_law_1.01,0.04826880097389221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,1,32,power_law_1.2,0.03720319867134094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,1,32,power_law_1.01,0.06874240040779114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,1,32,power_law_1.2,0.041503998637199405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,1,32,power_law_1.2,0.03761279881000519
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,1,32,power_law_1.01,0.08246399760246277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,1,32,power_law_1.2,0.04047360122203827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,1,32,power_law_1.01,0.10725760459899902
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,1,32,power_law_1.2,0.049491199851036075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,1,32,power_law_1.01,0.13018239736557008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,1,32,power_law_1.2,0.040064001083374025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,1,32,power_law_1.01,0.18629759550094604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,1,32,power_law_1.2,0.04619520008563995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,1,32,power_law_1.01,0.27026560306549074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,1,32,power_law_1.2,0.051532799005508424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,1,32,power_law_1.01,0.3767616033554077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,1,32,power_law_1.2,0.0728384017944336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,1,32,power_law_1.01,0.49288320541381836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,1,32,power_law_1.2,0.08409600257873535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,1,32,power_law_1.01,0.6671679973602295
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,1,32,power_law_1.2,0.12895359992980956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,1,32,power_law_1.01,1.006726360321045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,1,32,power_law_1.2,0.14369280338287355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,1,32,power_law_1.01,1.2309887886047364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,1,32,power_law_1.2,0.23338239192962645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,1,32,power_law_1.2,0.28664960861206057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,1,32,power_law_1.01,1.8156927108764649
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,1,32,power_law_1.2,0.45598721504211426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,1,32,power_law_1.01,4.049651336669922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,1,32,power_law_1.2,0.700275182723999
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,1,32,power_law_1.2,0.9824959754943847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,1,32,power_law_1.2,1.1719807624816894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,8,4,power_law_1.2,0.0815936028957367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,1,32,power_law_1.01,0.05973119735717773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,1,32,power_law_1.2,1.62030086517334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,8,4,power_law_1.2,0.08692479729652405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,1,32,power_law_1.01,0.042124798893928526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,1,32,power_law_1.2,2.3993663787841797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,8,4,power_law_1.2,0.06870399713516236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,1,32,power_law_1.01,0.039673599600791934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,1,32,power_law_1.01,0.04007680118083954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,8,4,power_law_1.2,0.07626879811286927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,1,32,power_law_1.2,5.449849700927734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,1,32,power_law_1.01,0.040064001083374025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,8,4,power_law_1.2,0.09430400133132935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,1,32,power_law_1.01,0.042534399032592776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,8,4,power_law_1.2,0.10003199577331542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,1,32,power_law_1.01,0.04293760061264038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,8,4,power_law_1.2,0.1254207968711853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,1,32,power_law_1.2,0.05726720094680786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,1,32,power_law_1.01,0.04314880073070526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,1,32,power_law_1.2,0.040889599919319154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,8,4,power_law_1.2,0.1340288043022156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,1,32,power_law_1.01,0.042534399032592776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,1,32,power_law_1.2,0.038848000764846805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,8,4,power_law_1.2,0.13997440338134765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,1,32,power_law_1.01,0.043347200751304625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,1,32,power_law_1.2,0.03924480080604553
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,8,4,power_law_1.2,0.1426367998123169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,1,32,power_law_1.01,0.043968001008033754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,1,32,power_law_1.2,0.04170239865779877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,8,4,power_law_1.2,0.1477311968803406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,1,32,power_law_1.01,0.044582399725914004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,1,32,power_law_1.2,0.04211840033531189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,8,4,power_law_1.2,0.15287679433822632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,1,32,power_law_1.01,0.04581120014190674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,1,32,power_law_1.2,0.04230400025844574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,8,4,power_law_1.2,0.15409280061721803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,1,32,power_law_1.01,0.049491199851036075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,1,32,power_law_1.2,0.04211840033531189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,8,4,power_law_1.2,0.15779199600219726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,1,32,power_law_1.01,0.05195519924163818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,1,32,power_law_1.2,0.042931199073791504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,1,32,power_law_1.01,0.057068800926208495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,1,32,power_law_1.2,0.0431551992893219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,8,4,power_law_1.2,0.16802560091018676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,1,32,power_law_1.2,0.04355199933052063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,1,32,power_law_1.01,0.059334397315979004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,8,4,power_law_1.2,0.17089920043945311
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,1,32,power_law_1.2,0.04457600116729736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,1,32,power_law_1.01,0.0683456003665924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,8,4,power_law_1.2,0.19219839572906494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,1,32,power_law_1.2,0.047014400362968445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,1,32,power_law_1.01,0.06915199756622314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,8,4,power_law_1.2,0.2089855909347534
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,1,32,power_law_1.2,0.04989440143108368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,1,32,power_law_1.01,0.08573439717292786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,8,4,power_law_1.2,0.2233151912689209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,1,32,power_law_1.2,0.054201602935791016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,1,32,power_law_1.01,0.10722559690475464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,8,4,power_law_1.2,0.26590719223022463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,1,32,power_law_1.2,0.057683199644088745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,1,32,power_law_1.01,0.12813440561294556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,8,4,power_law_1.2,0.29621760845184325
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,1,32,power_law_1.2,0.06239359974861145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,1,32,power_law_1.01,0.14165760278701783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,8,4,power_law_1.2,0.3734463930130005
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,1,32,power_law_1.2,0.07018240094184876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,1,32,power_law_1.01,0.19182080030441284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,8,4,power_law_1.2,0.4201216220855713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,1,32,power_law_1.2,0.07918720245361328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,1,32,power_law_1.01,0.22684800624847412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,1,32,power_law_1.2,0.0949567973613739
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,8,4,power_law_1.2,0.5731200218200684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,1,32,power_law_1.01,0.32371840476989744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,1,32,power_law_1.2,0.10396159887313842
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,8,4,power_law_1.2,0.6937407970428466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,1,32,power_law_1.01,0.39969921112060547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,1,32,power_law_1.2,0.13714560270309448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,8,4,power_law_1.2,0.9972672462463379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,1,32,power_law_1.01,0.5543295860290527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,1,32,power_law_1.2,0.15905280113220216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,8,4,power_law_1.2,1.3403072357177734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,1,32,power_law_1.01,0.8768896102905274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,1,32,power_law_1.2,0.23278720378875734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,1,32,power_law_1.2,0.2600127935409546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,8,4,power_law_1.2,1.5301376342773438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,1,32,power_law_1.01,1.4908736228942872
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,1,32,power_law_1.2,0.47034878730773927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,8,4,power_law_1.2,2.547590446472168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,1,32,power_law_1.2,0.5383488178253174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,8,4,power_law_1.2,4.7379199981689455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,1,32,power_law_1.2,0.7670400142669678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,2,16,power_law_1.01,0.022457599639892578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,16,2,power_law_1.01,1.8909311294555664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,2,16,power_law_1.01,0.01959040015935898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,2,16,power_law_1.01,0.020614400506019592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,16,2,power_law_1.01,3.887583923339844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,2,16,power_law_1.01,0.02040960043668747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,2,16,power_law_1.2,0.0230335995554924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,2,16,power_law_1.01,0.023897600173950196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,2,16,power_law_1.2,0.01973759979009628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,2,16,power_law_1.01,0.029625600576400755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,2,16,power_law_1.2,0.020576000213623047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,2,16,power_law_1.01,0.05353599786758423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,2,16,power_law_1.01,0.030041599273681642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,2,16,power_law_1.2,0.021792000532150267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,2,16,power_law_1.01,0.04268159866333008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,2,16,power_law_1.01,0.03311359882354736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,2,16,power_law_1.2,0.02446720004081726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,2,16,power_law_1.01,0.03639039993286133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,2,16,power_law_1.01,0.03899520039558411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,2,16,power_law_1.2,0.028966400027275085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,2,16,power_law_1.01,0.03966079950332642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,2,16,power_law_1.01,0.04145280122756958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,2,16,power_law_1.2,0.029996800422668456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,2,16,power_law_1.01,0.04007039964199066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,2,16,power_law_1.01,0.04267520010471344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,2,16,power_law_1.2,0.03348479866981506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,2,16,power_law_1.01,0.03761279881000519
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,2,16,power_law_1.01,0.04575999975204468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,2,16,power_law_1.2,0.036550399661064145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,2,16,power_law_1.01,0.042131200432777405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,2,16,power_law_1.01,0.045132800936698914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,2,16,power_law_1.2,0.0406464010477066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,2,16,power_law_1.01,0.042335999011993405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,2,16,power_law_1.01,0.04616959989070892
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,2,16,power_law_1.2,0.04105600118637085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,2,16,power_law_1.01,0.04314880073070526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,2,16,power_law_1.01,0.04596480131149292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,2,16,power_law_1.2,0.03878400027751923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,2,16,power_law_1.01,0.049081599712371825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,2,16,power_law_1.01,0.04616959989070892
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,2,16,power_law_1.2,0.04433279931545257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,2,16,power_law_1.01,0.04663679897785187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,2,16,power_law_1.01,0.04759039878845215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,2,16,power_law_1.2,0.04474239945411682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,2,16,power_law_1.01,0.058911997079849246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,2,16,power_law_1.2,0.04597119987010956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,2,16,power_law_1.01,0.0486272007226944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,2,16,power_law_1.01,0.06833279728889466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,2,16,power_law_1.01,0.049030399322509764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,2,16,power_law_1.2,0.05048959851264954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,2,16,power_law_1.01,0.08921599984169007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,2,16,power_law_1.2,0.04965760111808777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,2,16,power_law_1.01,0.04984959959983826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,2,16,power_law_1.01,0.10559999942779541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,2,16,power_law_1.2,0.05969280004501343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,2,16,power_law_1.01,0.05578879714012146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,2,16,power_law_1.01,0.1588544011116028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,2,16,power_law_1.2,0.06951680183410644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,2,16,power_law_1.01,0.05620480179786682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,2,16,power_law_1.01,0.06479359865188598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,2,16,power_law_1.2,0.09735040068626404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,2,16,power_law_1.01,0.19694080352783203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,2,16,power_law_1.01,0.07605760097503662
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,2,16,power_law_1.2,0.1225600004196167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,2,16,power_law_1.01,0.2919359922409058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,2,16,power_law_1.01,0.07790079712867737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,2,16,power_law_1.2,0.16456320285797119
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,2,16,power_law_1.01,0.36611840724945066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,2,16,power_law_1.01,0.09183359742164612
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,2,16,power_law_1.2,0.2265984058380127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,2,16,power_law_1.01,0.5551487922668457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,2,16,power_law_1.01,0.10616320371627808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,2,16,power_law_1.2,0.301145601272583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,2,16,power_law_1.01,0.7363903999328614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,2,16,power_law_1.01,0.1372928023338318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,2,16,power_law_1.2,0.42975358963012694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,2,16,power_law_1.01,0.9502016067504883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,2,16,power_law_1.01,0.15018880367279053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,2,16,power_law_1.2,0.6859392166137696
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,2,16,power_law_1.01,1.5641983985900878
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,2,16,power_law_1.01,0.2089855909347534
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,2,16,power_law_1.2,0.8796992301940918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,2,16,power_law_1.01,0.25731201171875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,2,16,power_law_1.01,3.0901504516601563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,2,16,power_law_1.2,1.1796671867370605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,2,16,power_law_1.01,0.3394432067871094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,2,16,power_law_1.2,1.9858240127563476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,2,16,power_law_1.01,0.42626562118530276
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,2,16,power_law_1.2,0.05603839755058289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,2,16,power_law_1.2,3.5162689208984377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,2,16,power_law_1.01,0.5235392093658447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,2,16,power_law_1.2,0.03882879912853241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,2,16,power_law_1.01,0.8178367614746094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,2,16,power_law_1.2,0.03966720104217529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,2,16,power_law_1.2,0.0412992000579834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,2,16,power_law_1.01,1.5768447875976563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,2,16,power_law_1.2,0.042124798893928526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,4,8,power_law_1.01,0.0201664000749588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,2,16,power_law_1.2,0.045414400100708005
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,4,8,power_law_1.01,0.020160000026226043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,2,16,power_law_1.2,0.045407998561859134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,4,8,power_law_1.01,0.020147199928760528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,2,16,power_law_1.2,0.04622080028057098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,4,8,power_law_1.01,0.02078080028295517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,4,8,power_law_1.2,0.01973759979009628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,2,16,power_law_1.2,0.046623998880386354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,4,8,power_law_1.2,0.01932799965143204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,4,8,power_law_1.01,0.02160000056028366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,2,16,power_law_1.2,0.047443199157714847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,4,8,power_law_1.2,0.01932799965143204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,4,8,power_law_1.01,0.023443199694156647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,2,16,power_law_1.2,0.04807040095329285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,4,8,power_law_1.01,0.02651520073413849
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,4,8,power_law_1.2,0.020147199928760528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,2,16,power_law_1.2,0.04847359955310822
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,4,8,power_law_1.2,0.02096640020608902
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,4,8,power_law_1.01,0.03142400085926056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,4,8,power_law_1.2,0.023839999735355378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,2,16,power_law_1.2,0.0494271993637085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,4,8,power_law_1.01,0.03265919983386993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,4,8,power_law_1.2,0.026291200518608095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,4,8,power_law_1.01,0.035104000568389894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,2,16,power_law_1.2,0.051551997661590576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,4,8,power_law_1.2,0.03080959916114807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,4,8,power_law_1.01,0.04085119962692261
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,2,16,power_law_1.2,0.05788800120353699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,4,8,power_law_1.01,0.03470079898834229
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,2,16,power_law_1.2,0.05973119735717773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,4,8,power_law_1.2,0.03243519961833954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,4,8,power_law_1.01,0.03735679984092712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,2,16,power_law_1.2,0.06629120111465454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,4,8,power_law_1.2,0.035308799147605895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,4,8,power_law_1.01,0.04227840006351471
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,2,16,power_law_1.2,0.07672960162162781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,4,8,power_law_1.2,0.040217599272727965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,4,8,power_law_1.01,0.04084480106830597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,4,8,power_law_1.2,0.035308799147605895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,2,16,power_law_1.2,0.084934401512146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,4,8,power_law_1.01,0.043084800243377686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,4,8,power_law_1.2,0.037350401282310486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,2,16,power_law_1.2,0.10561280250549317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,4,8,power_law_1.01,0.05129600167274475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,4,8,power_law_1.2,0.04348160028457641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,2,16,power_law_1.2,0.10807039737701415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,4,8,power_law_1.01,0.053548800945281985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,4,8,power_law_1.2,0.040627199411392215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,2,16,power_law_1.2,0.1569983959197998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,4,8,power_law_1.01,0.06439679861068726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,4,8,power_law_1.2,0.043699198961257936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,2,16,power_law_1.2,0.15578880310058593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,4,8,power_law_1.01,0.08303359746932984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,4,8,power_law_1.2,0.05146239995956421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,2,16,power_law_1.2,0.2336064100265503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,4,8,power_law_1.2,0.053523200750350955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,4,8,power_law_1.01,0.10247679948806762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,2,16,power_law_1.2,0.30467839241027833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,4,8,power_law_1.2,0.06725760102272034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,4,8,power_law_1.01,0.13608319759368898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,2,16,power_law_1.2,0.42284159660339354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,4,8,power_law_1.2,0.08528640270233154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,4,8,power_law_1.01,0.17231359481811523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,2,16,power_law_1.2,0.5285183906555175
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,4,8,power_law_1.2,0.1018623948097229
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,4,8,power_law_1.01,0.23991680145263672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,2,16,power_law_1.2,0.7646463871002197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,4,8,power_law_1.2,0.14302719831466676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,4,8,power_law_1.01,0.31281280517578125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,2,16,power_law_1.2,1.2104703903198242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,4,8,power_law_1.2,0.16925439834594727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,4,8,power_law_1.01,0.47318401336669924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,4,8,power_law_1.2,0.2646912097930908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,4,8,power_law_1.01,0.6325056076049804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,2,16,power_law_1.2,3.001273536682129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,4,8,power_law_1.2,0.34496641159057617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,4,8,power_law_1.01,0.7756608009338379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,4,8,power_law_1.2,0.464569616317749
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,4,8,power_law_1.01,1.178502368927002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,4,8,power_law_1.2,0.6527743816375733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,4,8,power_law_1.01,0.046419200301170346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,4,8,power_law_1.01,2.397670364379883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,4,8,power_law_1.01,0.041715198755264284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,4,8,power_law_1.2,0.887059211730957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,4,8,power_law_1.01,0.041503998637199405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,4,8,power_law_1.2,1.26757755279541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,4,8,power_law_1.01,0.04273920059204102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,4,8,power_law_1.2,2.889811134338379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,4,8,power_law_1.01,0.04519039988517761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,4,8,power_law_1.2,0.05252479910850525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,4,8,power_law_1.01,0.04990079998970032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,4,8,power_law_1.2,0.041868799924850465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,4,8,power_law_1.01,0.05072640180587769
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,4,8,power_law_1.2,0.04390400052070618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,4,8,power_law_1.01,0.05134080052375793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,4,8,power_law_1.2,0.04433279931545257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,4,8,power_law_1.01,0.05195519924163818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,4,8,power_law_1.2,0.045151999592781066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,4,8,power_law_1.01,0.052774399518966675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,4,8,power_law_1.2,0.05080320239067078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,4,8,power_law_1.01,0.05399680137634277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,4,8,power_law_1.2,0.050860798358917235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,1,32,power_law_1.01,0.04103679955005646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,4,8,power_law_1.01,0.05480319857597351
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,4,8,power_law_1.2,0.052934402227401735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,1,32,power_law_1.01,0.037555199861526486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,4,8,power_law_1.01,0.05440639853477478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,4,8,power_law_1.2,0.05251839756965637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,1,32,power_law_1.01,0.03345920145511627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,4,8,power_law_1.01,0.05686399936676025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,4,8,power_law_1.2,0.0531391978263855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,1,32,power_law_1.01,0.04042240083217621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,4,8,power_law_1.01,0.0630079984664917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,4,8,power_law_1.2,0.054764801263809205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,1,32,power_law_1.01,0.04145280122756958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,4,8,power_law_1.01,0.06362879872322083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,4,8,power_law_1.2,0.055801600217819214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,1,32,power_law_1.01,0.04595839977264404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,4,8,power_law_1.01,0.06833279728889466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,4,8,power_law_1.2,0.056415998935699464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,1,32,power_law_1.01,0.04924159944057464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,4,8,power_law_1.01,0.08471680283546448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,1,32,power_law_1.01,0.06069759726524353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,4,8,power_law_1.01,0.08983680009841918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,1,32,power_law_1.01,0.06807039976119995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,4,8,power_law_1.01,0.10683519840240478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,1,32,power_law_1.01,0.07238399982452393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,4,8,power_law_1.01,0.11790080070495605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,1,32,power_law_1.01,0.09018880128860474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,4,8,power_law_1.01,0.14718079566955566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,1,32,power_law_1.01,0.10576640367507935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,4,8,power_law_1.01,0.17974400520324707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,1,32,power_law_1.01,0.07832319736480713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,4,8,power_law_1.01,0.239136004447937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,1,32,power_law_1.01,0.09429759979248047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,1,32,power_law_1.01,0.11763199567794799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,4,8,power_law_1.01,0.3067199945449829
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,1,32,power_law_1.01,0.08262400031089782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,4,8,power_law_1.01,0.4000959873199463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,1,32,power_law_1.01,0.09919999837875366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,4,8,power_law_1.01,0.5096640110015869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,1,32,power_law_1.01,0.14343680143356324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,4,8,power_law_1.01,0.6946112155914307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,1,32,power_law_1.01,0.18561919927597045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,4,8,power_law_1.01,1.021446418762207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,1,32,power_law_1.01,0.250764799118042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,1,32,power_law_1.01,0.33248000144958495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,4,8,power_law_1.01,1.705094337463379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,1,32,power_law_1.01,0.5088128089904785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,1,32,power_law_1.01,0.6356607913970947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,1,32,power_law_1.01,0.9648320198059082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,1,32,power_law_1.01,1.2141440391540528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,1,32,power_law_1.01,1.9415807723999023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,1,32,power_law_1.01,2.344825553894043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,1,32,power_law_1.2,0.04191359877586365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,1,32,power_law_1.2,0.028812798857688903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,1,32,power_law_1.01,3.2028865814208984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,1,32,power_law_1.2,0.03800959885120392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,1,32,power_law_1.01,5.486656188964844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,1,32,power_law_1.2,0.040889599919319154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,1,32,power_law_1.2,0.04170880019664765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,1,32,power_law_1.01,10.29208984375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,1,32,power_law_1.2,0.047040000557899475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,1,32,power_law_1.2,1.3927680015563966
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,1,32,power_law_1.2,0.05358719825744629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,1,32,power_law_1.2,0.05932160019874573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,1,32,power_law_1.2,3.053280067443848
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,1,32,power_law_1.2,0.06833279728889466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,1,32,power_law_1.01,0.132806396484375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,1,32,power_law_1.2,0.07530239820480347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,1,32,power_law_1.01,0.08118399977684021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,1,32,power_law_1.2,0.08922880291938781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,1,32,power_law_1.01,0.062745600938797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,1,32,power_law_1.2,0.11994240283966065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,1,32,power_law_1.2,0.1064255952835083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,1,32,power_law_1.01,0.06766080260276794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,1,32,power_law_1.2,0.06853119730949402
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,1,32,power_law_1.2,0.07919359803199769
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,1,32,power_law_1.01,0.06439679861068726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,1,32,power_law_1.2,0.06259840130805969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,1,32,power_law_1.2,0.09579520225524903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,1,32,power_law_1.01,0.0838271975517273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,1,32,power_law_1.2,0.06648319959640503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,1,32,power_law_1.2,0.11523200273513794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,1,32,power_law_1.01,0.08302720189094544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,1,32,power_law_1.2,0.06913920044898987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,1,32,power_law_1.2,0.0873856008052826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,1,32,power_law_1.01,0.08486400246620178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,1,32,power_law_1.2,0.08184959888458251
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,1,32,power_law_1.2,0.1060096025466919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,1,32,power_law_1.01,0.08568320274353028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,1,32,power_law_1.2,0.08328319787979126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,1,32,power_law_1.01,0.08240640163421631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,1,32,power_law_1.2,0.15434880256652833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,1,32,power_law_1.2,0.08533120155334473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,1,32,power_law_1.01,0.0852735996246338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,1,32,power_law_1.2,0.18343039751052856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,1,32,power_law_1.2,0.08494719862937927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,1,32,power_law_1.01,0.0899839997291565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,1,32,power_law_1.2,0.27784318923950196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,1,32,power_law_1.2,0.08636159896850586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,1,32,power_law_1.01,0.08773120045661927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,1,32,power_law_1.2,0.3689856052398682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,1,32,power_law_1.2,0.08696320056915283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,1,32,power_law_1.01,0.09183359742164612
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,1,32,power_law_1.2,0.5272704124450683
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,1,32,power_law_1.2,0.09085440039634704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,1,32,power_law_1.01,0.10043519735336304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,1,32,power_law_1.2,0.6974720001220703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,1,32,power_law_1.2,0.0871616005897522
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,1,32,power_law_1.01,0.09797120094299316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,1,32,power_law_1.2,1.0243519783020019
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,1,32,power_law_1.2,0.08983680009841918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,1,32,power_law_1.01,0.10145920515060425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,1,32,power_law_1.2,1.4148863792419433
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,1,32,power_law_1.2,0.09721599817276001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,1,32,power_law_1.01,0.11701760292053223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,1,32,power_law_1.2,2.0485567092895507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,1,32,power_law_1.2,0.10151679515838623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,1,32,power_law_1.01,0.1381183981895447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,1,32,power_law_1.2,2.9381887435913088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,1,32,power_law_1.2,0.11175040006637574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,1,32,power_law_1.01,0.16085120439529418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,1,32,power_law_1.2,0.1256767988204956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,1,32,power_law_1.2,3.7536895751953123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,1,32,power_law_1.01,0.16104960441589355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,1,32,power_law_1.2,0.1352895975112915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,1,32,power_law_1.01,0.21183359622955322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,1,32,power_law_1.2,6.388652801513672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,1,32,power_law_1.2,0.1742143988609314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,1,32,power_law_1.01,0.2605760097503662
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,1,32,power_law_1.2,0.19941120147705077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,1,32,power_law_1.01,0.3302144050598145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,1,32,power_law_1.2,12.911129760742188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,1,32,power_law_1.2,0.2507967948913574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,1,32,power_law_1.01,0.4151360034942627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,1,32,power_law_1.2,0.2886912107467651
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,1,32,power_law_1.01,0.5968639850616455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,1,32,power_law_1.2,0.36569600105285643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,1,32,power_law_1.01,0.7658239841461182
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,1,32,power_law_1.2,0.46789121627807617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,2,16,power_law_1.01,0.03597440123558045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,1,32,power_law_1.01,0.9366208076477051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,1,32,power_law_1.2,0.8109375953674316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,2,16,power_law_1.01,0.040889599919319154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,1,32,power_law_1.01,1.5276479721069336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,1,32,power_law_1.2,1.24203519821167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,2,16,power_law_1.01,0.02512640058994293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,2,16,power_law_1.01,0.02655999958515167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,1,32,power_law_1.2,1.2420415878295898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,1,32,power_law_1.01,2.899628829956055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,2,16,power_law_1.01,0.038438400626182555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,1,32,power_law_1.2,1.8422847747802735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,2,16,power_law_1.01,0.04397439956665039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,2,16,power_law_1.01,0.05235840082168579
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,1,32,power_law_1.2,4.854438400268554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,2,16,power_law_1.01,0.05482239723205566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,2,16,power_law_1.2,0.03612160086631775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,2,16,power_law_1.01,0.05686399936676025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,2,16,power_law_1.2,0.024249599874019624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,2,16,power_law_1.01,0.06547840237617493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,2,16,power_law_1.2,0.026495999097824095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,2,16,power_law_1.01,0.11215360164642334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,2,16,power_law_1.01,0.07571200132369996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,2,16,power_law_1.2,0.02690559923648834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,2,16,power_law_1.01,0.07858560085296631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,2,16,power_law_1.01,0.08840320110321045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,2,16,power_law_1.2,0.03570559918880463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,2,16,power_law_1.01,0.05707520246505737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,2,16,power_law_1.01,0.06791679859161377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,2,16,power_law_1.2,0.04472320079803467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,2,16,power_law_1.01,0.06525440216064453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,2,16,power_law_1.01,0.0810368001461029
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,2,16,power_law_1.2,0.05251839756965637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,2,16,power_law_1.01,0.06814079880714416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,2,16,power_law_1.01,0.09189760088920593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,2,16,power_law_1.2,0.054553598165512085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,2,16,power_law_1.01,0.08021759986877441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,2,16,power_law_1.01,0.07203199863433837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,2,16,power_law_1.2,0.056806397438049314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,2,16,power_law_1.01,0.08184959888458251
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,2,16,power_law_1.01,0.08676480054855347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,2,16,power_law_1.2,0.06520320177078247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,2,16,power_law_1.01,0.082259202003479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,2,16,power_law_1.01,0.10663679838180543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,2,16,power_law_1.2,0.07708160281181335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,2,16,power_law_1.01,0.08635519742965699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,2,16,power_law_1.01,0.08492159843444824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,2,16,power_law_1.01,0.13244800567626952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,2,16,power_law_1.2,0.09017599821090698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,2,16,power_law_1.01,0.08840320110321045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,2,16,power_law_1.2,0.0695039987564087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,2,16,power_law_1.01,0.1883520007133484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,2,16,power_law_1.01,0.09065600037574768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,2,16,power_law_1.2,0.07954559922218322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,2,16,power_law_1.01,0.23259520530700684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,2,16,power_law_1.01,0.09189119935035706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,2,16,power_law_1.2,0.09591680169105529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,2,16,power_law_1.01,0.3528064012527466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,2,16,power_law_1.01,0.09393919706344604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,2,16,power_law_1.2,0.07339519858360291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,2,16,power_law_1.01,0.44332160949707033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,2,16,power_law_1.01,0.09925119876861573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,2,16,power_law_1.2,0.08957440257072449
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,2,16,power_law_1.01,0.6475008010864258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,2,16,power_law_1.01,0.10068479776382447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,2,16,power_law_1.2,0.1090432047843933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,2,16,power_law_1.01,0.8187264442443848
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,2,16,power_law_1.01,0.1060096025466919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,2,16,power_law_1.2,0.13893120288848876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,2,16,power_law_1.01,1.2088512420654296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,2,16,power_law_1.01,0.12117760181427002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,2,16,power_law_1.2,0.1897279977798462
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,2,16,power_law_1.01,1.7059200286865235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,2,16,power_law_1.01,0.13466880321502686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,2,16,power_law_1.2,0.24522240161895753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,2,16,power_law_1.01,2.162816047668457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,2,16,power_law_1.01,0.16499840021133422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,2,16,power_law_1.2,0.36462719440460206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,2,16,power_law_1.01,0.1707327961921692
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,2,16,power_law_1.01,3.443423843383789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,2,16,power_law_1.2,0.44858241081237793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,2,16,power_law_1.01,0.20923519134521484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,2,16,power_law_1.2,0.6920896053314209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,2,16,power_law_1.01,6.847219085693359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,2,16,power_law_1.01,0.2430272102355957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,2,16,power_law_1.2,0.9255104064941406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,2,16,power_law_1.01,0.3413183927536011
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,2,16,power_law_1.2,1.3554304122924805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,2,16,power_law_1.01,0.41588478088378905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,2,16,power_law_1.2,1.6964351654052734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,2,16,power_law_1.2,0.12076159715652465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,2,16,power_law_1.01,0.5391615867614746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,2,16,power_law_1.2,2.2553279876708983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,2,16,power_law_1.2,0.060550397634506224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,2,16,power_law_1.01,0.7384384155273438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,2,16,power_law_1.2,3.8392574310302736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,2,16,power_law_1.2,0.06177279949188232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,2,16,power_law_1.01,0.8690879821777344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,2,16,power_law_1.2,0.0652671992778778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,2,16,power_law_1.2,7.555769348144532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,2,16,power_law_1.01,1.4222463607788085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,2,16,power_law_1.2,0.06773759722709656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,2,16,power_law_1.2,0.07836800217628478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,2,16,power_law_1.01,2.6295488357543944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,2,16,power_law_1.2,0.08390399813652039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,2,16,power_law_1.2,0.08247039914131164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,2,16,power_law_1.2,0.08389120101928711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,4,8,power_law_1.01,0.026284798979759216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,2,16,power_law_1.2,0.08985599875450134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,4,8,power_law_1.2,0.022457599639892578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,4,8,power_law_1.01,0.03490560054779053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,2,16,power_law_1.2,0.09229440093040467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,4,8,power_law_1.2,0.02409600019454956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,4,8,power_law_1.01,0.02876160144805908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,2,16,power_law_1.2,0.09066240191459655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,4,8,power_law_1.2,0.024505600333213806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,4,8,power_law_1.01,0.032025599479675294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,2,16,power_law_1.2,0.09248639941215515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,4,8,power_law_1.2,0.02449920028448105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,4,8,power_law_1.01,0.0409855991601944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,2,16,power_law_1.2,0.09598079919815064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,4,8,power_law_1.2,0.0310591995716095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,4,8,power_law_1.01,0.04309119880199432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,2,16,power_law_1.2,0.1017151951789856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,4,8,power_law_1.2,0.03433600068092346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,4,8,power_law_1.01,0.04799999892711639
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,2,16,power_law_1.2,0.10313600301742554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,4,8,power_law_1.2,0.03882879912853241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,4,8,power_law_1.01,0.05537279844284058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,2,16,power_law_1.2,0.11092480421066284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,4,8,power_law_1.2,0.047007998824119566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,4,8,power_law_1.01,0.05865600109100342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,4,8,power_law_1.2,0.0590719997882843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,4,8,power_law_1.2,0.05235840082168579
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,4,8,power_law_1.01,0.06479359865188598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,2,16,power_law_1.2,0.13018879890441895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,4,8,power_law_1.2,0.06480640172958374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,4,8,power_law_1.2,0.06096640229225159
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,4,8,power_law_1.01,0.06808320283889771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,2,16,power_law_1.2,0.14657280445098878
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,4,8,power_law_1.2,0.06972159743309021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,4,8,power_law_1.2,0.0634112000465393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,4,8,power_law_1.01,0.07503359913825988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,2,16,power_law_1.2,0.16254719495773315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,4,8,power_law_1.2,0.07526400089263915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,4,8,power_law_1.2,0.07486720085144043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,4,8,power_law_1.01,0.06968960165977478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,2,16,power_law_1.2,0.18343679904937743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,4,8,power_law_1.2,0.08712319731712341
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,4,8,power_law_1.2,0.06218879818916321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,4,8,power_law_1.01,0.07114880084991455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,2,16,power_law_1.2,0.2334144115447998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,4,8,power_law_1.2,0.09633920192718506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,4,8,power_law_1.2,0.06791679859161377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,4,8,power_law_1.01,0.08528640270233154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,2,16,power_law_1.2,0.2718976020812988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,4,8,power_law_1.2,0.11272959709167481
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,4,8,power_law_1.2,0.07936000227928161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,4,8,power_law_1.01,0.076883202791214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,2,16,power_law_1.2,0.3739007949829102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,4,8,power_law_1.2,0.1344383955001831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,4,8,power_law_1.2,0.07100160121917724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,4,8,power_law_1.01,0.07995520234107971
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,2,16,power_law_1.2,0.4756864070892334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,4,8,power_law_1.2,0.17294080257415773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,4,8,power_law_1.2,0.07672320008277893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,4,8,power_law_1.01,0.09511039853096008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,2,16,power_law_1.2,0.6995264053344726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,4,8,power_law_1.2,0.2179840087890625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,4,8,power_law_1.2,0.09330559968948364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,4,8,power_law_1.01,0.11066880226135253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,4,8,power_law_1.2,0.27514240741729734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,2,16,power_law_1.2,0.8314175605773926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,4,8,power_law_1.2,0.11338880062103271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,4,8,power_law_1.01,0.14137599468231202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,4,8,power_law_1.2,0.3568511962890625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,2,16,power_law_1.2,1.1363712310791017
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,4,8,power_law_1.2,0.1539199948310852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,4,8,power_law_1.01,0.17990399599075318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,4,8,power_law_1.2,0.5317567825317383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,4,8,power_law_1.2,0.19264639616012574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,2,16,power_law_1.2,1.859110450744629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,4,8,power_law_1.01,0.24563839435577392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,4,8,power_law_1.2,0.7150464057922363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,4,8,power_law_1.2,0.272710394859314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,4,8,power_law_1.01,0.31423358917236327
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,2,16,power_law_1.2,3.6906238555908204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,4,8,power_law_1.2,0.9095999717712402
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,4,8,power_law_1.2,0.3548543930053711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,4,8,power_law_1.01,0.45310077667236326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,4,8,power_law_1.2,1.4308095932006837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,4,8,power_law_1.2,0.5207104206085205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,4,8,power_law_1.01,0.600544023513794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,4,8,power_law_1.2,0.6868159770965576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,4,8,power_law_1.01,0.8858431816101074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,4,8,power_law_1.2,3.023731231689453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,4,8,power_law_1.2,1.019820785522461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,4,8,power_law_1.01,0.0818560004234314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,4,8,power_law_1.01,1.1522815704345704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,4,8,power_law_1.01,0.07838720083236694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,4,8,power_law_1.2,1.349343967437744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,4,8,power_law_1.01,1.4225728034973144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,4,8,power_law_1.01,0.06117119789123535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,4,8,power_law_1.2,1.682156753540039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,4,8,power_law_1.01,2.3251840591430666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,4,8,power_law_1.2,0.08936960101127625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,4,8,power_law_1.01,0.06751360297203064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,4,8,power_law_1.2,2.684441566467285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,4,8,power_law_1.2,0.061939197778701785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,4,8,power_law_1.01,0.07486079931259156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,4,8,power_law_1.01,4.5675201416015625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,4,8,power_law_1.2,0.06234880089759827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,4,8,power_law_1.01,0.0908415973186493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,4,8,power_law_1.2,5.32940788269043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,4,8,power_law_1.2,0.07011200189590454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,4,8,power_law_1.01,0.09290239810943604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,4,8,power_law_1.2,0.07300480008125305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,4,8,power_law_1.01,0.09413759708404541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,4,8,power_law_1.2,0.0902079999446869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,4,8,power_law_1.01,0.09783040285110474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,1,32,power_law_1.01,0.10739200115203858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,4,8,power_law_1.2,0.09102720022201538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,4,8,power_law_1.01,0.09698560237884521
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,1,32,power_law_1.2,0.09986559748649597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,1,32,power_law_1.01,0.11845760345458985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,4,8,power_law_1.01,0.09943680167198181
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,4,8,power_law_1.2,0.0946943998336792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,1,32,power_law_1.2,0.11584639549255371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,1,32,power_law_1.01,0.1120959997177124
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,4,8,power_law_1.2,0.09799039959907532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,4,8,power_law_1.01,0.09947519898414611
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,1,32,power_law_1.2,0.09700480103492737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,1,32,power_law_1.01,0.07749760150909424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,4,8,power_law_1.2,0.09733759760856628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,4,8,power_law_1.01,0.10027519464492798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,1,32,power_law_1.2,0.07323520183563233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,1,32,power_law_1.01,0.07992320060729981
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,4,8,power_law_1.2,0.10249600410461426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,4,8,power_law_1.01,0.1043776035308838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,1,32,power_law_1.2,0.08798720240592957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,1,32,power_law_1.01,0.09390720129013061
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,4,8,power_law_1.2,0.10392320156097412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,4,8,power_law_1.01,0.11074559688568116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,4,8,power_law_1.2,0.10188159942626954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,4,8,power_law_1.01,0.11297919750213622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,1,32,power_law_1.2,0.08655999898910523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,1,32,power_law_1.01,0.09589759707450866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,4,8,power_law_1.2,0.10842239856719971
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,4,8,power_law_1.01,0.11951999664306641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,1,32,power_law_1.01,0.10371840000152588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,4,8,power_law_1.2,0.11272959709167481
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,4,8,power_law_1.01,0.13715200424194335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,1,32,power_law_1.01,0.10635520219802856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,4,8,power_law_1.2,0.12174079418182374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,4,8,power_law_1.01,0.15374720096588135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,1,32,power_law_1.01,0.11353600025177002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,4,8,power_law_1.2,0.12664320468902587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,4,8,power_law_1.01,0.17728639841079713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,4,8,power_law_1.2,0.14507520198822021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,1,32,power_law_1.01,0.10779520273208618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,4,8,power_law_1.01,0.19367040395736695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,4,8,power_law_1.2,0.1596351981163025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,4,8,power_law_1.01,0.23915519714355468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,1,32,power_law_1.01,0.11025279760360718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,4,8,power_law_1.2,0.18277759552001954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,4,8,power_law_1.01,0.28377599716186525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,1,32,power_law_1.01,0.11518080234527588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,4,8,power_law_1.2,0.20571520328521728
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,4,8,power_law_1.01,0.3861632108688354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,1,32,power_law_1.01,0.11720960140228272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,4,8,power_law_1.2,0.2530112028121948
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,4,8,power_law_1.01,0.48222718238830564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,1,32,power_law_1.01,0.12009600400924683
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,4,8,power_law_1.2,0.31548800468444826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,4,8,power_law_1.01,0.7060863971710205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,1,32,power_law_1.01,0.12460800409317016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,4,8,power_law_1.2,0.4258687973022461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,4,8,power_law_1.01,0.8621312141418457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,1,32,power_law_1.01,0.12747520208358765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,4,8,power_law_1.2,0.530515193939209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,4,8,power_law_1.01,1.0913087844848632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,1,32,power_law_1.01,0.14302719831466676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,4,8,power_law_1.2,0.7121791839599609
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,4,8,power_law_1.01,1.7022335052490234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,1,32,power_law_1.01,0.15408639907836913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,4,8,power_law_1.2,1.0814080238342285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,1,32,power_law_1.01,0.18645119667053223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,4,8,power_law_1.2,1.1248512268066406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,4,8,power_law_1.01,3.320083236694336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,1,32,power_law_1.01,0.21184000968933106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,4,8,power_law_1.2,1.9955904006958007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,1,32,power_law_1.01,0.26263039112091063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,4,8,power_law_1.2,4.829260635375976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,1,32,power_law_1.01,0.3017600059509277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,2,16,power_law_1.01,0.07631999850273133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,1,32,power_law_1.01,0.3851072072982788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,2,16,power_law_1.01,0.10888320207595825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,1,32,power_law_1.01,0.47521281242370605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,2,16,power_law_1.01,0.12855039834976195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,2,16,power_law_1.2,0.09470080137252808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,1,32,power_law_1.01,0.6572800159454346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,2,16,power_law_1.01,0.0716159999370575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,2,16,power_law_1.2,0.10802559852600098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,1,32,power_law_1.01,0.8256256103515625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,2,16,power_law_1.01,0.0775488018989563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,2,16,power_law_1.2,0.09327359795570374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,1,32,power_law_1.01,0.9796416282653808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,2,16,power_law_1.01,0.0955839991569519
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,2,16,power_law_1.2,0.07259520292282104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,2,16,power_law_1.01,0.09742079973220825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,1,32,power_law_1.01,1.5428223609924316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,2,16,power_law_1.2,0.08365439772605895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,2,16,power_law_1.01,0.11052160263061524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,2,16,power_law_1.2,0.0934656023979187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,1,32,power_law_1.01,2.9479551315307617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,2,16,power_law_1.01,0.10888960361480712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,2,16,power_law_1.2,0.09594240188598632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,2,16,power_law_1.01,0.10806399583816528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,2,16,power_law_1.2,0.1074112057685852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,2,16,power_law_1.01,0.11296000480651855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,2,16,power_law_1.2,0.11007360219955445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,4,8,power_law_1.01,0.08199679851531982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,2,16,power_law_1.2,0.10986239910125732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,2,16,power_law_1.01,0.11893119812011718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,4,8,power_law_1.01,0.09204480051994324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,2,16,power_law_1.01,0.1174847960472107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,2,16,power_law_1.2,0.1123136043548584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,4,8,power_law_1.01,0.12091519832611083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,2,16,power_law_1.01,0.11708159446716308
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,2,16,power_law_1.2,0.11806080341339112
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,4,8,power_law_1.01,0.07462400197982788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,2,16,power_law_1.2,0.11539839506149292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,2,16,power_law_1.01,0.1271232008934021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,4,8,power_law_1.01,0.0852735996246338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,2,16,power_law_1.2,0.12584320306777955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,2,16,power_law_1.01,0.13653119802474975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,4,8,power_law_1.01,0.10166399478912354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,2,16,power_law_1.2,0.13115520477294923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,2,16,power_law_1.01,0.1400256037712097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,4,8,power_law_1.01,0.10965119600296021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,2,16,power_law_1.2,0.1350592017173767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,2,16,power_law_1.01,0.1568127989768982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,2,16,power_law_1.2,0.1414080023765564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,4,8,power_law_1.01,0.12378239631652832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,2,16,power_law_1.01,0.1715648055076599
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,2,16,power_law_1.2,0.15656319856643677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,4,8,power_law_1.01,0.1258239984512329
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,2,16,power_law_1.01,0.20288639068603515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,2,16,power_law_1.2,0.17479039430618287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,4,8,power_law_1.01,0.12767360210418702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,2,16,power_law_1.01,0.22645120620727538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,2,16,power_law_1.2,0.20120320320129395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,4,8,power_law_1.01,0.13013119697570802
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,2,16,power_law_1.01,0.2805183887481689
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,2,16,power_law_1.2,0.23519999980926515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,4,8,power_law_1.01,0.13217920064926147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,2,16,power_law_1.01,0.30877439975738524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,2,16,power_law_1.2,0.292742395401001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,4,8,power_law_1.01,0.140556800365448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,2,16,power_law_1.01,0.40052480697631837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,4,8,power_law_1.01,0.14057600498199463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,2,16,power_law_1.2,0.3260799884796143
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,2,16,power_law_1.01,0.49329280853271484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,4,8,power_law_1.01,0.1538879990577698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,2,16,power_law_1.2,0.4190847873687744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,2,16,power_law_1.01,0.6626495838165283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,4,8,power_law_1.01,0.15326720476150513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,2,16,power_law_1.2,0.5485504150390625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,2,16,power_law_1.01,0.8965439796447754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,4,8,power_law_1.01,0.16145919561386107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,2,16,power_law_1.2,0.745363187789917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,2,16,power_law_1.01,1.049721622467041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,4,8,power_law_1.01,0.18398720026016235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,2,16,power_law_1.2,0.9591744422912598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,2,16,power_law_1.01,1.6293184280395507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,4,8,power_law_1.01,0.19688960313796997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,2,16,power_law_1.2,1.2239551544189453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,2,16,power_law_1.01,3.2537921905517577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,4,8,power_law_1.01,0.23293440341949462
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,2,16,power_law_1.2,1.9088127136230468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,4,8,power_law_1.01,0.2634495973587036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,4,8,power_law_1.01,0.33471999168395994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,2,16,power_law_1.2,3.815852737426758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,4,8,power_law_1.01,0.36401278972625734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,4,8,power_law_1.2,0.08144000172615051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,4,8,power_law_1.01,0.4760447978973389
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,4,8,power_law_1.2,0.08759679794311523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,4,8,power_law_1.01,0.575974416732788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,4,8,power_law_1.2,0.07858560085296631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,4,8,power_law_1.2,0.06915199756622314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,4,8,power_law_1.01,0.8100671768188477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,8,4,power_law_1.01,0.08528640270233154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,4,8,power_law_1.2,0.0859391987323761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,8,4,power_law_1.01,0.08732799887657165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,4,8,power_law_1.01,1.0111807823181151
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,8,4,power_law_1.01,0.10884480476379395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,4,8,power_law_1.2,0.10008959770202637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,4,8,power_law_1.01,1.2292927742004394
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,8,4,power_law_1.01,0.08773760199546814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,4,8,power_law_1.2,0.10478719472885131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,4,8,power_law_1.01,1.9399423599243164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,8,4,power_law_1.01,0.09819520115852357
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,4,8,power_law_1.2,0.12014720439910889
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,4,8,power_law_1.01,3.5576576232910155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,8,4,power_law_1.01,0.1192896008491516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,4,8,power_law_1.2,0.12464640140533448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,8,4,power_law_1.01,0.13915519714355468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,4,8,power_law_1.2,0.12691199779510498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,8,4,power_law_1.01,0.15410560369491577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,4,8,power_law_1.2,0.12833919525146484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,8,4,power_law_1.01,0.15900800228118897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,4,8,power_law_1.2,0.13284480571746826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,8,4,power_law_1.2,0.08486400246620178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,8,4,power_law_1.01,0.16475520133972169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,4,8,power_law_1.2,0.1410367965698242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,8,4,power_law_1.2,0.09348480105400085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,8,4,power_law_1.01,0.16883200407028198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,4,8,power_law_1.2,0.14636160135269166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,8,4,power_law_1.2,0.08957440257072449
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,8,4,power_law_1.01,0.18153599500656128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,4,8,power_law_1.2,0.15025919675827026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,8,4,power_law_1.2,0.0828224003314972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,8,4,power_law_1.01,0.17580800056457518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,4,8,power_law_1.2,0.15763839483261108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,8,4,power_law_1.01,0.19158400297164918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,8,4,power_law_1.2,0.09900799989700318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,4,8,power_law_1.2,0.1684991955757141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,8,4,power_law_1.01,0.19854719638824464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,4,8,power_law_1.2,0.19264639616012574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,8,4,power_law_1.2,0.11578880548477173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,8,4,power_law_1.01,0.20366079807281495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,4,8,power_law_1.2,0.20984320640563964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,8,4,power_law_1.2,0.1350399971008301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,8,4,power_law_1.2,0.1561344027519226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,8,4,power_law_1.01,0.21799681186676026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,4,8,power_law_1.2,0.2399616003036499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,8,4,power_law_1.01,0.244979190826416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,8,4,power_law_1.2,0.1637120008468628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,4,8,power_law_1.2,0.26474881172180176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,8,4,power_law_1.01,0.2575040102005005
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,8,4,power_law_1.2,0.15859839916229249
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,4,8,power_law_1.2,0.3312959909439087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,8,4,power_law_1.01,0.3124160051345825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,8,4,power_law_1.2,0.16556160449981688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,4,8,power_law_1.2,0.3804480075836182
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,8,4,power_law_1.01,0.34250240325927733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,8,4,power_law_1.2,0.17456640005111695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,4,8,power_law_1.2,0.5023104190826416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,8,4,power_law_1.01,0.4129727840423584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,8,4,power_law_1.2,0.18439680337905884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,4,8,power_law_1.2,0.5850560188293457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,8,4,power_law_1.01,0.48014078140258787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,8,4,power_law_1.2,0.1970944046974182
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,4,8,power_law_1.2,0.896947193145752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,8,4,power_law_1.01,0.6140736103057861
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,8,4,power_law_1.2,0.20283520221710205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,4,8,power_law_1.2,1.0683712005615233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,8,4,power_law_1.2,0.20692479610443115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,8,4,power_law_1.01,0.7523071765899658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,4,8,power_law_1.2,1.3567296028137208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,8,4,power_law_1.2,0.21777920722961425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,8,4,power_law_1.01,1.0496767997741698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,4,8,power_law_1.2,2.067795181274414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,8,4,power_law_1.2,0.25566720962524414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,8,4,power_law_1.01,1.3046591758728028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,8,4,power_law_1.2,0.2630399942398071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,4,8,power_law_1.2,3.9716159820556642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,8,4,power_law_1.01,1.6314111709594727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,8,4,power_law_1.2,0.3117824077606201
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,8,4,power_law_1.01,2.3734912872314453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,8,4,power_law_1.2,0.354585599899292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,8,4,power_law_1.2,0.4350719928741455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,8,4,power_law_1.01,4.782508850097656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,8,4,power_law_1.2,0.49118719100952146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,8,4,power_law_1.2,0.6600704193115234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,16,2,power_law_1.01,0.08758400082588196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,8,4,power_law_1.2,0.7854911804199218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,16,2,power_law_1.01,0.09516159892082214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,8,4,power_law_1.2,1.1584383964538574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,16,2,power_law_1.01,0.1091007947921753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,8,4,power_law_1.2,1.3513471603393554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,16,2,power_law_1.2,0.08773760199546814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,16,2,power_law_1.01,0.10561280250549317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,8,4,power_law_1.2,1.6612159729003906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,1,32,power_law_1.2,0.08840320110321045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,16,2,power_law_1.2,0.09674879908561707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,16,2,power_law_1.01,0.13367680311203003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,1,32,power_law_1.2,0.09781119823455811
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,8,4,power_law_1.2,2.6044992446899413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,16,2,power_law_1.2,0.10045440196990967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,16,2,power_law_1.01,0.16458879709243773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,1,32,power_law_1.2,0.10519039630889893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,16,2,power_law_1.2,0.1074112057685852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,16,2,power_law_1.01,0.18588160276412963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,1,32,power_law_1.2,0.10498559474945068
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,8,4,power_law_1.2,4.923257446289062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,16,2,power_law_1.2,0.12748160362243652
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,16,2,power_law_1.01,0.2264319896697998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,1,32,power_law_1.2,0.10314879417419434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,16,2,power_law_1.2,0.1565567970275879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,16,2,power_law_1.01,0.2356544017791748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,1,32,power_law_1.2,0.11009279489517212
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,16,2,power_law_1.2,0.18134399652481079
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,16,2,power_law_1.01,0.2457024097442627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,1,32,power_law_1.2,0.11248639822006226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,16,2,power_law_1.2,0.2186176061630249
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,16,2,power_law_1.01,0.25797119140625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,1,32,power_law_1.2,0.11072640419006348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,16,2,power_law_1.2,0.23111040592193605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,16,2,power_law_1.01,0.2608511924743652
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,1,32,power_law_1.2,0.12013440132141114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,16,2,power_law_1.2,0.23868160247802733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,16,2,power_law_1.01,0.27149438858032227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,1,32,power_law_1.2,0.12199039459228515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,16,2,power_law_1.2,0.24955520629882813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,1,32,power_law_1.2,0.1289471983909607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,16,2,power_law_1.01,0.27968640327453614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,16,2,power_law_1.01,0.3048896074295044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,1,32,power_law_1.2,0.14533120393753052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,16,2,power_law_1.01,0.29688320159912107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,1,32,power_law_1.2,0.16744320392608641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,16,2,power_law_1.01,0.3302720069885254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,1,32,power_law_1.2,0.20432639122009277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,16,2,power_law_1.01,0.36815359592437746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,1,32,power_law_1.2,0.21271679401397706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,8,power_law_1.01,0.03694080114364624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,16,2,power_law_1.01,0.4070784091949463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,1,32,power_law_1.2,0.2788671970367432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,8,power_law_1.01,0.0385919988155365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,16,2,power_law_1.01,0.48224639892578125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,1,32,power_law_1.2,0.30344319343566895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,8,power_law_1.01,0.03449600040912628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,8,power_law_1.01,0.034892800450325015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,16,2,power_law_1.01,0.5420351982116699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,1,32,power_law_1.2,0.4119679927825928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,8,power_law_1.01,0.036339199542999266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,16,2,power_law_1.01,0.6556992053985595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,8,power_law_1.01,0.044512000679969785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,1,32,power_law_1.2,0.5055744171142578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,8,power_law_1.01,0.049644801020622256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,16,2,power_law_1.01,0.7413119792938232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,1,32,power_law_1.2,0.7138432025909424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,8,power_law_1.01,0.03777279853820801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,16,2,power_law_1.01,0.9551039695739746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,8,power_law_1.01,0.03777279853820801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,1,32,power_law_1.2,0.9358528137207032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,8,power_law_1.01,0.0406143993139267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,16,2,power_law_1.01,1.1511167526245116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,1,32,power_law_1.2,1.1814208030700684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,8,power_law_1.01,0.03898879885673523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,8,power_law_1.01,0.041043201088905336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,16,2,power_law_1.01,1.542470359802246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,1,32,power_law_1.2,2.0440448760986327
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,8,power_law_1.01,0.043296000361442565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,16,2,power_law_1.01,1.9731775283813477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,8,power_law_1.01,0.04759039878845215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,1,32,power_law_1.2,3.6705535888671874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,8,power_law_1.01,0.053324800729751584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,16,2,power_law_1.01,2.4157184600830077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,8,power_law_1.01,0.058246397972106935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,8,power_law_1.01,0.062745600938797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,16,2,power_law_1.01,3.727084732055664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,8,power_law_1.01,0.07728639841079712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,8,power_law_1.01,0.08240640163421631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,8,power_law_1.01,0.09962239861488342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,16,2,power_law_1.01,7.332390594482422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,8,power_law_1.01,0.11763199567794799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,8,power_law_1.01,0.16965759992599488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,8,power_law_1.01,0.18153599500656128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,8,power_law_1.01,0.2437824010848999
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,8,power_law_1.01,0.33533439636230467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,8,power_law_1.01,0.4506368160247803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,8,power_law_1.01,0.7068416118621826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,8,power_law_1.01,0.8792832374572754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,8,power_law_1.01,1.3517696380615234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,8,power_law_1.01,2.443065643310547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,8,power_law_1.2,0.036582401394844054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,8,power_law_1.2,0.037401598691940305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,8,power_law_1.2,0.03413119912147522
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,8,power_law_1.2,0.03678719997406006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,8,power_law_1.2,0.038022398948669434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,8,power_law_1.2,0.046623998880386354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,8,power_law_1.2,0.051948797702789304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,4,power_law_1.01,0.03187200129032135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,8,power_law_1.2,0.0367935985326767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,4,power_law_1.01,0.03208959996700287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,8,power_law_1.2,0.04026240110397339
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,4,power_law_1.01,0.03146879971027374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,8,power_law_1.2,0.04007680118083954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,4,power_law_1.01,0.031673601269721983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,8,power_law_1.2,0.039238399267196654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,4,power_law_1.01,0.03310079872608185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,8,power_law_1.2,0.04456959962844849
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,4,power_law_1.01,0.04092159867286682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,8,power_law_1.2,0.04784640073776245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,4,power_law_1.01,0.04560000002384186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,8,power_law_1.2,0.04725759923458099
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,4,power_law_1.01,0.03454720079898834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,8,power_law_1.2,0.055219197273254396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,4,power_law_1.01,0.037215998768806456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,8,power_law_1.2,0.057894402742385866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,4,power_law_1.2,0.032025599479675294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,4,power_law_1.01,0.03802880048751831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,8,power_law_1.2,0.0685375988483429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,4,power_law_1.2,0.03244799971580505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,4,power_law_1.01,0.03885439932346344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,8,power_law_1.2,0.08881919980049133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,4,power_law_1.2,0.031615999341011045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,4,power_law_1.01,0.04048640131950378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,8,power_law_1.2,0.08389120101928711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,4,power_law_1.2,0.03243519961833954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,4,power_law_1.01,0.03986560106277466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,8,power_law_1.2,0.10028799772262573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,4,power_law_1.2,0.03325439989566803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,4,power_law_1.01,0.04826239943504333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,8,power_law_1.2,0.11707520484924316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,4,power_law_1.2,0.04141440093517303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,4,power_law_1.01,0.053600001335144046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,8,power_law_1.2,0.15207040309906006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,4,power_law_1.2,0.04718720018863678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,4,power_law_1.01,0.05358719825744629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,4,power_law_1.2,0.03531520068645477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,8,power_law_1.2,0.18628480434417724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,4,power_law_1.01,0.06321920156478882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,4,power_law_1.2,0.03653120100498199
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,8,power_law_1.2,0.2737407922744751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,4,power_law_1.01,0.08327680230140685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,4,power_law_1.2,0.03816959857940674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,8,power_law_1.2,0.35012478828430177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,4,power_law_1.01,0.08472319841384887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,4,power_law_1.2,0.03877759873867035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,8,power_law_1.2,0.5543168067932129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,4,power_law_1.01,0.09229440093040467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,4,power_law_1.2,0.0412416011095047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,8,power_law_1.2,0.6974720001220703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,4,power_law_1.01,0.10561280250549317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,4,power_law_1.2,0.0414463996887207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,8,power_law_1.2,0.9284799575805665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,4,power_law_1.01,0.13162879943847655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,4,power_law_1.2,0.047993600368499756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,8,power_law_1.2,1.4431488037109375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,4,power_law_1.01,0.16787840127944947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,4,power_law_1.2,0.05516800284385681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,8,power_law_1.2,2.9041919708251953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,4,power_law_1.01,0.20533759593963624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,4,power_law_1.2,0.060288000106811526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,4,power_law_1.01,0.31081600189208985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,4,power_law_1.2,0.0602944016456604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,4,power_law_1.2,0.07708799839019775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,4,power_law_1.01,0.4863232135772705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,4,power_law_1.2,0.07707520127296448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,4,power_law_1.01,0.5203199863433838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,4,power_law_1.2,0.10104320049285889
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,4,power_law_1.01,0.6995327949523926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,4,power_law_1.2,0.10862720012664795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,4,power_law_1.01,1.0079360008239746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,4,power_law_1.2,0.1575551986694336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,4,power_law_1.01,2.1116287231445314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,4,power_law_1.2,0.1913599967956543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,4,power_law_1.2,0.24543359279632568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,4,power_law_1.2,0.34415359497070314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,4,power_law_1.2,0.4711103916168213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,4,power_law_1.2,0.674393606185913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,4,power_law_1.2,0.8182527542114257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,4,power_law_1.2,1.2977024078369142
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,4,power_law_1.2,2.594233512878418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,2,power_law_1.01,0.02961919903755188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,2,power_law_1.01,0.029420799016952513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,2,power_law_1.01,0.03023360073566437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,2,power_law_1.01,0.03146879971027374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,2,power_law_1.01,0.03351680040359497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,2,power_law_1.01,0.043347200751304625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,2,power_law_1.01,0.045407998561859134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,2,power_law_1.01,0.03514240086078644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,2,power_law_1.01,0.0355648010969162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,2,power_law_1.2,0.029420799016952513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,2,power_law_1.01,0.036595198512077334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,2,power_law_1.2,0.030035200715065002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,2,power_law_1.01,0.035769599676132205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,2,power_law_1.2,0.030035200715065002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,2,power_law_1.01,0.0367935985326767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,2,power_law_1.2,0.03208320140838623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,2,power_law_1.01,0.039443200826644896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,2,power_law_1.2,0.0343423992395401
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,2,power_law_1.01,0.040479999780654904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,2,power_law_1.2,0.04275839924812317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,2,power_law_1.01,0.04863359928131104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,2,power_law_1.2,0.04663040041923523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,2,power_law_1.2,0.035571199655532834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,2,power_law_1.2,0.035980799794197084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,2,power_law_1.2,0.037011200189590455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,2,power_law_1.2,0.03639039993286133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,2,power_law_1.2,0.038848000764846805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,2,power_law_1.2,0.03885439932346344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,2,power_law_1.2,0.04151679873466492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,8,power_law_1.01,0.063155198097229
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,2,power_law_1.2,0.04683519899845123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,8,power_law_1.01,0.06643199920654297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,2,power_law_1.2,0.055852800607681274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,8,power_law_1.01,0.06353920102119445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,2,power_law_1.2,0.05809919834136963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,8,power_law_1.01,0.04451839923858643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,2,power_law_1.2,0.0744704008102417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,8,power_law_1.01,0.051283198595047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,2,power_law_1.2,0.07407360076904297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,8,power_law_1.01,0.045977601408958436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,2,power_law_1.2,0.08882560133934021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,8,power_law_1.01,0.04657920002937317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,2,power_law_1.2,0.10335999727249146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,8,power_law_1.01,0.04185599982738495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,2,power_law_1.2,0.14472960233688353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,8,power_law_1.01,0.04062080085277557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,8,power_law_1.01,0.045132800936698914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,2,power_law_1.2,0.16234879493713378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,8,power_law_1.01,0.044537600874900815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,2,power_law_1.2,0.19552639722824097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,8,power_law_1.01,0.05434880256652832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,2,power_law_1.2,0.27149438858032227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,8,power_law_1.01,0.05575680136680603
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,2,power_law_1.2,0.4111807823181152
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,8,power_law_1.01,0.05947520136833191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,2,power_law_1.2,0.576038408279419
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,8,power_law_1.01,0.07217280268669128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,2,power_law_1.2,0.7249279975891113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,8,power_law_1.01,0.07462400197982788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,2,power_law_1.2,1.1543999671936036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,8,power_law_1.01,0.07504000067710877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,2,power_law_1.2,2.119808006286621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,8,power_law_1.01,0.10453120470046998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,8,power_law_1.01,0.10657279491424561
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,8,power_law_1.01,0.11866879463195801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,8,power_law_1.01,0.16330879926681519
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,8,power_law_1.01,0.2130687952041626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,8,power_law_1.01,0.29418239593505857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,8,power_law_1.01,0.409881591796875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,8,power_law_1.01,0.4952832221984863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,16,2,power_law_1.2,0.2581439971923828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,8,power_law_1.01,0.7817984104156495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,16,2,power_law_1.2,0.2694080114364624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,8,power_law_1.01,1.1526911735534668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,16,2,power_law_1.2,0.2767807960510254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,8,power_law_1.01,1.4643327713012695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,8,power_law_1.01,2.1295936584472654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,16,2,power_law_1.2,0.29459199905395506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,8,power_law_1.01,4.233491134643555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,16,2,power_law_1.2,0.2990783929824829
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,16,2,power_law_1.2,0.33228158950805664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,16,2,power_law_1.2,0.3611135959625244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,16,2,power_law_1.2,0.4088768005371094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,16,2,power_law_1.2,0.47277441024780276
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,16,2,power_law_1.2,0.5280576229095459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,16,2,power_law_1.2,0.6572991847991944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,16,2,power_law_1.2,0.7515071868896485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,16,2,power_law_1.2,1.0206015586853028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,8,power_law_1.2,0.06178560256958008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,16,2,power_law_1.2,1.188748836517334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,8,power_law_1.2,0.06528000235557556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,8,power_law_1.2,0.0630079984664917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,16,2,power_law_1.2,1.6292608261108399
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,8,power_law_1.2,0.050323200225830075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,8,power_law_1.2,0.05132799744606018
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,16,2,power_law_1.2,2.1052160263061523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,8,power_law_1.2,0.06668800115585327
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,8,power_law_1.2,0.07079039812088013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,16,2,power_law_1.2,2.563155174255371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,8,power_law_1.2,0.04764800071716309
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,8,power_law_1.2,0.05113599896430969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,16,2,power_law_1.2,3.8593280792236326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,8,power_law_1.2,0.05236480236053467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,8,power_law_1.2,0.043558400869369504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,16,2,power_law_1.2,7.531597137451172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,8,power_law_1.2,0.05379840135574341
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,8,power_law_1.2,0.05316479802131653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,8,power_law_1.2,0.061363202333450315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,4,power_law_1.01,0.044915199279785156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,8,power_law_1.2,0.06997759938240052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,4,power_law_1.01,0.050457602739334105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,8,power_law_1.2,0.07530879974365234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,4,power_law_1.01,0.03797119855880737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,8,power_law_1.2,0.08963840007781983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,4,power_law_1.01,0.03816959857940674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,8,power_law_1.2,0.10643839836120605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,4,power_law_1.01,0.038796800374984744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,8,power_law_1.2,0.1082751989364624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,4,power_law_1.01,0.04145280122756958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,8,power_law_1.2,0.1265023946762085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,4,power_law_1.01,0.04185599982738495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,8,power_law_1.2,0.1654080033302307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,4,power_law_1.01,0.04471679925918579
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,4,power_law_1.01,0.04268800020217896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,8,power_law_1.2,0.2379136085510254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,4,power_law_1.01,0.044326400756835936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,8,power_law_1.2,0.2706815958023071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,4,power_law_1.01,0.0488319993019104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,8,power_law_1.2,0.4511040210723877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,4,power_law_1.01,0.052313601970672606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,8,power_law_1.2,0.5510591983795166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,4,power_law_1.01,0.05578879714012146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,8,power_law_1.2,0.8463744163513184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,4,power_law_1.01,0.066048002243042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,8,power_law_1.2,1.181817626953125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,4,power_law_1.01,0.0729856014251709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,8,power_law_1.2,1.4937408447265625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,4,power_law_1.01,0.07381759881973267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,8,power_law_1.2,2.17838077545166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,4,power_law_1.01,0.07585279941558838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,4,power_law_1.01,0.08323839902877808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,8,power_law_1.2,4.635987091064453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,4,power_law_1.01,0.08241279721260071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,4,power_law_1.01,0.11436159610748291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,4,power_law_1.01,0.14180480241775512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,4,power_law_1.01,0.1987391948699951
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,4,power_law_1.01,0.21470720767974855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,4,power_law_1.2,0.042284798622131345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,4,power_law_1.01,0.31179521083831785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,4,power_law_1.2,0.04597119987010956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,4,power_law_1.01,0.40887041091918946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,4,power_law_1.2,0.03859840035438537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,4,power_law_1.01,0.470304012298584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,4,power_law_1.2,0.03859840035438537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,4,power_law_1.01,0.8071999549865723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,4,power_law_1.2,0.044947201013565065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,4,power_law_1.2,0.04902400076389313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,4,power_law_1.01,0.9902848243713379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,4,power_law_1.2,0.059487998485565186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,4,power_law_1.01,1.5768320083618164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,4,power_law_1.2,0.04391680061817169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,4,power_law_1.01,3.609881591796875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,4,power_law_1.2,0.04472320079803467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,4,power_law_1.2,0.04883840084075928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,4,power_law_1.2,0.05211520195007324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,4,power_law_1.2,0.053337597846984865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,4,power_law_1.2,0.05416319966316223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,4,power_law_1.2,0.06559360027313232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,4,power_law_1.2,0.07095680236816407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,4,power_law_1.2,0.08241279721260071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,4,power_law_1.2,0.0807807981967926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,4,power_law_1.2,0.08405759930610657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,4,power_law_1.2,0.10617599487304688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,4,power_law_1.2,0.13771519660949708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,4,power_law_1.2,0.14612480401992797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,4,power_law_1.2,0.18585599660873414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,4,power_law_1.2,0.2851775884628296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,2,power_law_1.01,0.03495680093765259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,4,power_law_1.2,0.3478208065032959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,2,power_law_1.01,0.050911998748779295
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,4,power_law_1.2,0.41276798248291013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,2,power_law_1.01,0.03413119912147522
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,4,power_law_1.2,0.7146240234375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,2,power_law_1.01,0.03761279881000519
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,4,power_law_1.2,1.0013504028320312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,2,power_law_1.01,0.05501440167427063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,4,power_law_1.2,1.1576064109802247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,2,power_law_1.01,0.059724801778793336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,4,power_law_1.2,1.798431968688965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,2,power_law_1.01,0.06526079773902893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,2,power_law_1.01,0.04007039964199066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,4,power_law_1.2,4.624051284790039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,2,power_law_1.01,0.042124798893928526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,2,power_law_1.01,0.04416640102863312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,2,power_law_1.01,0.04744960069656372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,2,power_law_1.01,0.050316798686981204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,2,power_law_1.01,0.050732797384262084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,2,power_law_1.2,0.04268159866333008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,2,power_law_1.01,0.05421440005302429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,2,power_law_1.2,0.03633280098438263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,2,power_law_1.01,0.06546559929847717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,2,power_law_1.2,0.03694719970226288
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,2,power_law_1.01,0.07203199863433837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,2,power_law_1.2,0.03775359988212586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,2,power_law_1.01,0.06750720143318176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,2,power_law_1.2,0.03898879885673523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,2,power_law_1.01,0.07938560247421264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,2,power_law_1.2,0.03919999897480011
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,2,power_law_1.01,0.08472319841384887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,2,power_law_1.2,0.0412416011095047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,2,power_law_1.01,0.11195520162582398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,2,power_law_1.2,0.04023039937019348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,2,power_law_1.01,0.13244800567626952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,2,power_law_1.2,0.04371199905872345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,2,power_law_1.01,0.16725759506225585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,2,power_law_1.2,0.0430976003408432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,2,power_law_1.01,0.21006081104278565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,2,power_law_1.2,0.04595839977264404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,2,power_law_1.01,0.28952960968017577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,2,power_law_1.2,0.05088000297546387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,2,power_law_1.01,0.3544255971908569
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,2,power_law_1.2,0.051097601652145386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,2,power_law_1.01,0.4773248195648193
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,2,power_law_1.2,0.0525056004524231
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,2,power_law_1.01,0.6753664016723633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,2,power_law_1.2,0.06541439890861511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,2,power_law_1.01,0.8985919952392578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,2,power_law_1.01,0.05195519924163818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,2,power_law_1.2,0.07175040245056152
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,64,power_law_1.01,0.22373759746551514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,2,power_law_1.01,1.3022527694702148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,2,power_law_1.01,0.05686399936676025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,2,power_law_1.2,0.06540160179138184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,64,power_law_1.01,0.1047551989555359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,2,power_law_1.01,0.07366399765014649
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,2,power_law_1.01,2.6610944747924803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,2,power_law_1.2,0.0852735996246338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,64,power_law_1.01,0.0961471974849701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,2,power_law_1.01,0.06915199756622314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,2,power_law_1.2,0.09755520224571228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,2,power_law_1.01,0.08532480001449586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,64,power_law_1.01,0.09347839951515198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,2,power_law_1.2,0.11067520380020142
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,2,power_law_1.01,0.10191359519958496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,2,power_law_1.2,0.1424191951751709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,64,power_law_1.01,0.09100800156593322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,2,power_law_1.01,0.14041600227355958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,2,power_law_1.2,0.17946879863739013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,64,power_law_1.01,0.09471359848976135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,2,power_law_1.01,0.16500480175018312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,2,power_law_1.2,0.21982719898223876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,2,power_law_1.01,0.2178368091583252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,64,power_law_1.01,0.10351999998092651
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,2,power_law_1.2,0.27984640598297117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,2,power_law_1.01,0.2702591896057129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,64,power_law_1.01,0.10371840000152588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,2,power_law_1.2,0.38489599227905275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,2,power_law_1.01,0.3349760055541992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,2,power_law_1.2,0.44490880966186525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,64,power_law_1.01,0.10658559799194336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,2,power_law_1.01,0.5915967941284179
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,2,power_law_1.2,0.6998784065246582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,64,power_law_1.01,0.10290559530258178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,2,power_law_1.01,0.6630784034729004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,2,power_law_1.2,0.9751296043395996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,64,power_law_1.01,0.10659199953079224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,2,power_law_1.01,1.0581184387207032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,2,power_law_1.2,1.3705984115600587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,64,power_law_1.01,0.11065599918365479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,2,power_law_1.01,1.97521915435791
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,2,power_law_1.2,2.5893695831298826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,64,power_law_1.01,0.1123263955116272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,64,power_law_1.01,0.1133504033088684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,64,power_law_1.01,0.12705279588699342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,64,power_law_1.01,0.12748160362243652
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,64,power_law_1.01,0.13731199502944946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,64,power_law_1.2,0.1221951961517334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,64,power_law_1.01,0.15982719659805297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,64,power_law_1.2,0.1072383999824524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,64,power_law_1.01,0.1569599986076355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,64,power_law_1.2,0.0748799979686737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,64,power_law_1.01,0.19055360555648804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,64,power_law_1.01,0.20568959712982177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,64,power_law_1.2,0.08349440097808838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,64,power_law_1.01,0.26797440052032473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,64,power_law_1.2,0.08389760255813598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,64,power_law_1.01,0.3208127975463867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,64,power_law_1.2,0.09127680063247681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,64,power_law_1.01,0.434662389755249
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,64,power_law_1.2,0.10623359680175781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,64,power_law_1.2,0.10581120252609252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,64,power_law_1.01,0.5464896202087403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,64,power_law_1.2,0.10252799987792968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,64,power_law_1.01,0.7100671768188477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,64,power_law_1.2,0.10519039630889893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,64,power_law_1.01,0.8694592475891113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,64,power_law_1.2,0.09925119876861573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,64,power_law_1.01,1.1608832359313965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,32,power_law_1.01,0.11379200220108032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,32,power_law_1.2,0.11476479768753052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,64,power_law_1.2,0.10928640365600586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,32,power_law_1.01,0.1029312014579773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,64,power_law_1.01,1.8999744415283204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,32,power_law_1.2,0.10575360059738159
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,64,power_law_1.2,0.12097920179367065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,32,power_law_1.01,0.08225280046463013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,32,power_law_1.2,0.06684799790382386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,64,power_law_1.2,0.1150272011756897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,64,power_law_1.01,3.8380287170410154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,32,power_law_1.01,0.06832640171051026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,32,power_law_1.2,0.07379840016365051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,64,power_law_1.2,0.12240639925003052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,32,power_law_1.01,0.08001279830932617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,32,power_law_1.2,0.08487679958343505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,64,power_law_1.2,0.12895359992980956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,32,power_law_1.01,0.08798080086708068
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,32,power_law_1.2,0.0844543993473053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,64,power_law_1.2,0.1382143974304199
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,32,power_law_1.01,0.09454079866409301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,32,power_law_1.2,0.09735680222511292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,64,power_law_1.2,0.151692795753479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,32,power_law_1.01,0.09659519791603088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,32,power_law_1.2,0.10042879581451417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,64,power_law_1.2,0.1748479962348938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,32,power_law_1.01,0.10273920297622681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,32,power_law_1.2,0.10043519735336304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,64,power_law_1.2,0.2073983907699585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,32,power_law_1.01,0.10191999673843384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,32,power_law_1.2,0.10083839893341065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,64,power_law_1.2,0.23627519607543945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,32,power_law_1.01,0.10253440141677857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,32,power_law_1.2,0.10576640367507935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,64,power_law_1.2,0.31123199462890627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,32,power_law_1.01,0.1047808051109314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,32,power_law_1.2,0.10698239803314209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,64,power_law_1.2,0.3863231897354126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,32,power_law_1.01,0.10723199844360351
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,32,power_law_1.2,0.10819200277328492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,64,power_law_1.2,0.5473536014556885
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,32,power_law_1.01,0.1137984037399292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,32,power_law_1.2,0.115174400806427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,64,power_law_1.2,0.6219200134277344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,32,power_law_1.01,0.11766400337219238
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,32,power_law_1.2,0.12213759422302246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,64,power_law_1.2,0.9772095680236816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,32,power_law_1.01,0.12034560441970825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,32,power_law_1.2,0.12746880054473878
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,64,power_law_1.2,1.3960448265075684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,32,power_law_1.01,0.13119360208511352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,32,power_law_1.2,0.13689600229263305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,64,power_law_1.2,1.7788223266601562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,32,power_law_1.01,0.15148160457611085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,32,power_law_1.2,0.16350719928741456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,16,power_law_1.01,0.0971455991268158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,64,power_law_1.2,2.6520767211914062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,32,power_law_1.01,0.14778879880905152
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,32,power_law_1.2,0.15143680572509766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,16,power_law_1.01,0.11867519617080688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,32,power_law_1.01,0.1785024046897888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,32,power_law_1.2,0.19525760412216187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,16,power_law_1.01,0.06480640172958374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,64,power_law_1.2,6.576882934570312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,32,power_law_1.01,0.18977919816970826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,16,power_law_1.01,0.06604160070419311
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,32,power_law_1.01,0.23319680690765382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,16,power_law_1.01,0.07976319789886474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,16,power_law_1.01,0.08611199855804444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,32,power_law_1.01,0.28705921173095705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,16,power_law_1.01,0.0955136001110077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,32,power_law_1.01,0.38842239379882815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,16,power_law_1.01,0.10002559423446655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,32,power_law_1.01,0.4478271961212158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,16,power_law_1.01,0.10126719474792481
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,32,power_law_1.01,0.6349440097808838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,16,power_law_1.01,0.10329600572586059
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,32,power_law_1.01,0.847590446472168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,16,power_law_1.01,0.10495359897613525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,32,power_law_1.01,1.0165568351745606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,16,power_law_1.01,0.10311039686203002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,32,power_law_1.01,1.4998720169067383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,16,power_law_1.01,0.10781439542770385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,16,power_law_1.01,0.11068799495697021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,32,power_law_1.01,3.266886520385742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,16,power_law_1.01,0.11355520486831665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,16,power_law_1.01,0.12665599584579468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,16,power_law_1.01,0.13935359716415405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,16,power_law_1.01,0.14919040203094483
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,16,power_law_1.01,0.1553279995918274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,16,power_law_1.2,0.09352319836616516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,16,power_law_1.01,0.173363196849823
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,16,power_law_1.2,0.10172799825668336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,16,power_law_1.01,0.20364799499511718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,16,power_law_1.2,0.058508801460266116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,16,power_law_1.01,0.23868799209594727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,16,power_law_1.2,0.06547840237617493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,16,power_law_1.01,0.2984895944595337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,16,power_law_1.2,0.0773311972618103
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,16,power_law_1.01,0.35992319583892823
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,16,power_law_1.2,0.07611520290374756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,16,power_law_1.01,0.4375296115875244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,16,power_law_1.2,0.09824000000953674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,16,power_law_1.01,0.7019264221191406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,16,power_law_1.2,0.09905920028686524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,16,power_law_1.2,0.09782400131225585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,16,power_law_1.01,0.8170432090759278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,16,power_law_1.2,0.09926400184631348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,16,power_law_1.01,0.9489279747009277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,16,power_law_1.2,0.10602240562438965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,16,power_law_1.01,1.5956735610961914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,16,power_law_1.2,0.10314879417419434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,16,power_law_1.2,0.11092480421066284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,16,power_law_1.01,2.9745983123779296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,8,power_law_1.01,0.06218240261077881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,16,power_law_1.2,0.11299200057983398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,8,power_law_1.01,0.08492799997329711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,16,power_law_1.2,0.1191167950630188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,8,power_law_1.01,0.0634112000465393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,16,power_law_1.2,0.125273597240448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,8,power_law_1.01,0.0630016028881073
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,16,power_law_1.2,0.13878400325775148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,8,power_law_1.01,0.07446399927139283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,16,power_law_1.2,0.15557760000228882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,8,power_law_1.01,0.08511999845504761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,16,power_law_1.2,0.16050560474395753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,8,power_law_1.01,0.0976256012916565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,16,power_law_1.2,0.17811199426651
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,8,power_law_1.01,0.10130560398101807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,16,power_law_1.2,0.20781440734863282
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,8,power_law_1.01,0.10438400506973267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,16,power_law_1.2,0.2583872079849243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,8,power_law_1.01,0.10560640096664428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,16,power_law_1.2,0.31449599266052247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,8,power_law_1.01,0.1082751989364624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,16,power_law_1.2,0.391923189163208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,8,power_law_1.01,0.11072640419006348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,16,power_law_1.2,0.5502336025238037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,8,power_law_1.01,0.11359360218048095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,16,power_law_1.2,0.7044415950775147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,8,power_law_1.01,0.11584639549255371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,16,power_law_1.2,1.0696000099182128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,8,power_law_1.01,0.12464640140533448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,16,power_law_1.2,1.322316837310791
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,8,power_law_1.01,0.13141759634017944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,8,power_law_1.01,0.1449280023574829
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,16,power_law_1.2,2.083769607543945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,8,power_law_1.2,0.06481279730796814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,8,power_law_1.01,0.1553663969039917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,8,power_law_1.2,0.08610560297966004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,16,power_law_1.2,3.738150405883789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,8,power_law_1.01,0.1760640025138855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,8,power_law_1.2,0.0590719997882843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,8,power_law_1.01,0.20042240619659424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,8,power_law_1.2,0.06603519916534424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,8,power_law_1.01,0.2280639886856079
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,8,power_law_1.2,0.07669119834899903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,8,power_law_1.01,0.27311999797821046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,8,power_law_1.2,0.08241919875144958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,8,power_law_1.01,0.34236159324646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,8,power_law_1.2,0.09635199904441834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,8,power_law_1.01,0.4136256217956543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,8,power_law_1.2,0.10126080513000488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,8,power_law_1.01,0.5133632183074951
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,8,power_law_1.2,0.10290559530258178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,8,power_law_1.01,0.7154880046844483
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,8,power_law_1.2,0.10495359897613525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,8,power_law_1.01,0.978451156616211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,8,power_law_1.2,0.10945919752120972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,8,power_law_1.01,1.0654911994934082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,8,power_law_1.2,0.10945919752120972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,8,power_law_1.01,1.7734912872314452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,8,power_law_1.2,0.11397119760513305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,8,power_law_1.2,0.11617920398712159
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,8,power_law_1.01,3.155072021484375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,8,power_law_1.2,0.12871040105819703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,8,power_law_1.2,0.12912000417709352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,8,power_law_1.2,0.13690240383148194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,8,power_law_1.2,0.16741119623184203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,8,power_law_1.2,0.18154879808425903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,8,power_law_1.2,0.20120959281921386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,8,power_law_1.2,0.23274879455566405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,8,power_law_1.2,0.2950079917907715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,8,power_law_1.2,0.35459840297698975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,4,power_law_1.01,0.060159999132156375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,8,power_law_1.2,0.4629312038421631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,4,power_law_1.01,0.06506239771842956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,8,power_law_1.2,0.5595903873443604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,4,power_law_1.01,0.060550397634506224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,8,power_law_1.2,0.8325887680053711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,4,power_law_1.01,0.06383360028266907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,8,power_law_1.2,0.9763584136962891
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,4,power_law_1.01,0.07611520290374756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,4,power_law_1.01,0.09086080193519593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,8,power_law_1.2,1.1935808181762695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,4,power_law_1.01,0.1051967978477478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,8,power_law_1.2,2.0444095611572264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,4,power_law_1.01,0.10848640203475952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,4,power_law_1.01,0.10765440464019775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,8,power_law_1.2,4.2789054870605465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,4,power_law_1.01,0.1121664047241211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,4,power_law_1.01,0.11831040382385254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,4,power_law_1.01,0.12403199672698975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,4,power_law_1.01,0.11953920125961304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,4,power_law_1.2,0.059724801778793336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,4,power_law_1.01,0.12999039888381958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,4,power_law_1.2,0.06382079720497132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,4,power_law_1.01,0.13511040210723876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,4,power_law_1.2,0.060550397634506224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,4,power_law_1.01,0.1445248007774353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,4,power_law_1.2,0.06403200030326843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,4,power_law_1.01,0.1564095973968506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,4,power_law_1.2,0.07119359970092773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,4,power_law_1.01,0.1782912015914917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,4,power_law_1.2,0.08615040183067321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,4,power_law_1.01,0.20861439704895018
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,4,power_law_1.2,0.1043776035308838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,4,power_law_1.01,0.23995521068572997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,4,power_law_1.2,0.1060096025466919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,4,power_law_1.01,0.2805183887481689
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,4,power_law_1.2,0.10969599485397338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,4,power_law_1.01,0.3378304004669189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,4,power_law_1.2,0.11235840320587158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,4,power_law_1.01,0.42244482040405273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,4,power_law_1.2,0.11747839450836181
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,4,power_law_1.01,0.536300802230835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,4,power_law_1.2,0.1211583971977234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,4,power_law_1.01,0.7044479846954346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,4,power_law_1.2,0.12567039728164672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,4,power_law_1.01,0.8842623710632325
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,4,power_law_1.2,0.13099520206451415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,4,power_law_1.01,1.199443244934082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,4,power_law_1.2,0.13630720376968383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,4,power_law_1.01,1.444377613067627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,4,power_law_1.2,0.14207359552383422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,4,power_law_1.2,0.15781760215759277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,4,power_law_1.01,2.1460287094116213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,4,power_law_1.2,0.1768704056739807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,4,power_law_1.01,4.14384651184082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,4,power_law_1.2,0.21367039680480956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,4,power_law_1.2,0.25259521007537844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,4,power_law_1.2,0.28330240249633787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,4,power_law_1.2,0.3455744028091431
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,4,power_law_1.2,0.4259007930755615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,2,power_law_1.01,0.06356480121612548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,4,power_law_1.2,0.5530816078186035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,32,power_law_1.2,0.2009984016418457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,2,power_law_1.01,0.06440320014953613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,32,power_law_1.2,0.25813119411468505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,4,power_law_1.2,0.6691967964172363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,2,power_law_1.01,0.06316800117492676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,32,power_law_1.2,0.3017600059509277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,4,power_law_1.2,0.9698368072509765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,2,power_law_1.01,0.07299200296401978
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,32,power_law_1.2,0.44532480239868166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,4,power_law_1.2,1.2526911735534667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,2,power_law_1.01,0.08426880240440368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,32,power_law_1.2,0.5333695888519288
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,2,power_law_1.01,0.10126080513000488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,4,power_law_1.2,1.5248576164245606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,32,power_law_1.2,0.8092351913452148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,2,power_law_1.01,0.11908479928970336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,4,power_law_1.2,2.431667137145996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,2,power_law_1.01,0.1268671989440918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,32,power_law_1.2,1.0279616355895995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,4,power_law_1.2,4.699481582641601
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,2,power_law_1.01,0.12829439640045165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,32,power_law_1.2,1.218611240386963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,2,power_law_1.01,0.13074560165405275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,32,power_law_1.2,2.0783935546875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,2,power_law_1.01,0.13771519660949708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,2,power_law_1.01,0.14468480348587037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,32,power_law_1.2,4.6256767272949215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,2,power_law_1.01,0.14673279523849486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,2,power_law_1.01,0.15656319856643677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,2,power_law_1.01,0.16537599563598632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,2,power_law_1.01,0.17212159633636476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,2,power_law_1.01,0.18563200235366822
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,2,power_law_1.01,0.2171839952468872
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,2,power_law_1.01,0.2517888069152832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,2,power_law_1.01,0.30215680599212646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,64,power_law_1.01,0.04989440143108368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,64,power_law_1.01,0.04170880019664765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,2,power_law_1.01,0.3769023895263672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,64,power_law_1.01,0.038841599225997926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,2,power_law_1.01,0.4772031784057617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,64,power_law_1.01,0.043756800889968875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,2,power_law_1.01,0.6222591876983643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,64,power_law_1.2,0.0500544011592865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,64,power_law_1.01,0.04293760061264038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,2,power_law_1.01,0.8055744171142578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,64,power_law_1.2,0.03899520039558411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,64,power_law_1.01,0.051744002103805545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,2,power_law_1.01,0.9972479820251465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,64,power_law_1.2,0.04268159866333008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,64,power_law_1.01,0.05235840082168579
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,64,power_law_1.2,0.04472959935665131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,2,power_law_1.01,1.3538175582885743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,64,power_law_1.01,0.055212801694869994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,64,power_law_1.2,0.04267520010471344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,64,power_law_1.01,0.05768960118293762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,2,power_law_1.01,1.7656383514404297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,64,power_law_1.2,0.052313601970672606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,64,power_law_1.01,0.05932160019874573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,2,power_law_1.01,2.1160831451416016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,64,power_law_1.2,0.053529602289199826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,64,power_law_1.01,0.06117119789123535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,64,power_law_1.2,0.05763840079307556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,64,power_law_1.01,0.0646399974822998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,2,power_law_1.01,3.135974311828613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,64,power_law_1.2,0.0584447979927063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,64,power_law_1.01,0.06627200245857238
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,2,power_law_1.01,6.219827270507812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,64,power_law_1.2,0.05947520136833191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,64,power_law_1.01,0.04990079998970032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,64,power_law_1.2,0.06376960277557372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,64,power_law_1.01,0.056460797786712646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,64,power_law_1.2,0.06480000019073487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,64,power_law_1.01,0.06096000075340271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,64,power_law_1.2,0.06972159743309021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,64,power_law_1.01,0.06833279728889466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,64,power_law_1.2,0.053337597846984865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,64,power_law_1.01,0.07979519963264466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,64,power_law_1.2,0.0586624026298523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,64,power_law_1.01,0.07611520290374756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,64,power_law_1.2,0.06133120059967041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,64,power_law_1.01,0.09168000221252441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,64,power_law_1.2,0.06541439890861511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,64,power_law_1.01,0.1043776035308838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,64,power_law_1.2,0.07913600206375122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,64,power_law_1.01,0.1326464056968689
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,64,power_law_1.2,0.08302720189094544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,64,power_law_1.01,0.16417920589447021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,64,power_law_1.2,0.10167039632797241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,64,power_law_1.01,0.22705280780792236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,64,power_law_1.2,0.13340799808502196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,32,power_law_1.01,0.03716480135917664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,64,power_law_1.01,0.3016000032424927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,32,power_law_1.01,0.03839359879493713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,64,power_law_1.2,0.15880320072174073
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,64,power_law_1.01,0.3630336046218872
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,32,power_law_1.01,0.03573119938373566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,64,power_law_1.2,0.2321216106414795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,64,power_law_1.01,0.5235904216766357
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,32,power_law_1.01,0.036959999799728395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,64,power_law_1.2,0.3439296007156372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,64,power_law_1.01,0.7212287902832031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,32,power_law_1.01,0.041043201088905336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,64,power_law_1.2,0.45187840461730955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,64,power_law_1.01,1.06876802444458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,32,power_law_1.01,0.04023039937019348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,64,power_law_1.2,0.598092794418335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,32,power_law_1.01,0.042284798622131345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,64,power_law_1.01,2.5455743789672853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,64,power_law_1.2,1.0658623695373535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,32,power_law_1.01,0.04678399860858917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,32,power_law_1.01,0.047200000286102294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,64,power_law_1.2,1.2292927742004394
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,32,power_law_1.01,0.04883840084075928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,64,power_law_1.2,1.667353630065918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,32,power_law_1.01,0.04965760111808777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,32,power_law_1.01,0.05498239994049072
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,64,power_law_1.2,4.91589126586914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,32,power_law_1.01,0.05661439895629883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,32,power_law_1.01,0.046988800168037415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,32,power_law_1.01,0.05211520195007324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,32,power_law_1.01,0.05743359923362732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,32,power_law_1.01,0.06480640172958374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,32,power_law_1.01,0.07095040082931518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,32,power_law_1.01,0.08796160221099854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,32,power_law_1.01,0.10022399425506592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,32,power_law_1.2,0.03903360068798065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,32,power_law_1.01,0.10085120201110839
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,32,power_law_1.2,0.0341376006603241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,32,power_law_1.01,0.12072319984436035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,32,power_law_1.2,0.04007039964199066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,32,power_law_1.01,0.1336192011833191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,32,power_law_1.2,0.03658879995346069
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,32,power_law_1.2,0.0380160003900528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,32,power_law_1.01,0.1872704029083252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,32,power_law_1.2,0.045388799905776975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,16,power_law_1.01,0.0398144006729126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,32,power_law_1.01,0.22168960571289062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,32,power_law_1.2,0.04663040041923523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,16,power_law_1.01,0.03777279853820801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,32,power_law_1.01,0.30707199573516847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,32,power_law_1.2,0.050310397148132326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,16,power_law_1.01,0.03386879861354828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,32,power_law_1.01,0.44819841384887693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,32,power_law_1.2,0.05295360088348389
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,16,power_law_1.01,0.04084480106830597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,32,power_law_1.01,0.5571392059326172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,32,power_law_1.2,0.05441280007362366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,16,power_law_1.01,0.041868799924850465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,32,power_law_1.01,0.7445312023162842
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,32,power_law_1.2,0.05563520193099976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,16,power_law_1.01,0.04472959935665131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,32,power_law_1.2,0.05727360248565674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,16,power_law_1.01,0.044121599197387694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,32,power_law_1.2,0.05973119735717773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,16,power_law_1.01,0.039001598954200745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,32,power_law_1.2,0.05051519870758057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,16,power_law_1.01,0.04391680061817169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,32,power_law_1.2,0.05482239723205566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,16,power_law_1.01,0.046751999855041505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,32,power_law_1.2,0.06198400259017944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,16,power_law_1.01,0.055379199981689456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,32,power_law_1.2,0.06505600214004517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,16,power_law_1.01,0.0615231990814209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,32,power_law_1.2,0.07733759880065919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,16,power_law_1.01,0.061318397521972656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,32,power_law_1.2,0.08881279826164246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,16,power_law_1.01,0.050457602739334105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,32,power_law_1.2,0.11155200004577637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,16,power_law_1.01,0.05660799741744995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,32,power_law_1.2,0.11236480474472046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,16,power_law_1.01,0.05886080265045166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,32,power_law_1.2,0.1363263964653015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,16,power_law_1.01,0.05886080265045166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,32,power_law_1.2,0.15619200468063354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,16,power_law_1.01,0.06890239715576171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,32,power_law_1.2,0.213753604888916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,16,power_law_1.01,0.07320320010185241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,16,power_law_1.01,0.09550719857215881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,32,power_law_1.2,0.2992768049240112
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,16,power_law_1.01,0.09838719964027405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,32,power_law_1.2,0.5579391956329346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,16,power_law_1.01,0.12152960300445556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,32,power_law_1.2,0.6198463916778565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,16,power_law_1.01,0.1343999981880188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,32,power_law_1.2,0.843289566040039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,16,power_law_1.01,0.1954624056816101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,32,power_law_1.2,1.199027156829834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,16,power_law_1.01,0.22371840476989746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,32,power_law_1.2,2.9885631561279298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,16,power_law_1.01,0.3418816089630127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,16,power_law_1.01,0.4313920021057129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,16,power_law_1.01,0.5472511768341064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,16,power_law_1.01,0.8243583679199219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,16,power_law_1.01,1.5395648002624511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,16,power_law_1.2,0.04620159864425659
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,16,power_law_1.2,0.03925119936466217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,16,power_law_1.2,0.03433600068092346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,16,power_law_1.2,0.03392640054225922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,16,power_law_1.2,0.035980799794197084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,16,power_law_1.2,0.04416640102863312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,16,power_law_1.2,0.04498560130596161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,8,power_law_1.01,0.03612160086631775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,16,power_law_1.2,0.04948480129241943
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,8,power_law_1.01,0.030796799063682555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,16,power_law_1.2,0.05175039768218994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,8,power_law_1.01,0.04023039937019348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,16,power_law_1.2,0.05358719825744629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,8,power_law_1.01,0.03550719916820526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,8,power_law_1.01,0.04451839923858643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,8,power_law_1.01,0.0455487996339798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,8,power_law_1.01,0.0471807986497879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,8,power_law_1.01,0.05006080269813538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,8,power_law_1.01,0.05251839756965637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,8,power_law_1.01,0.05495679974555969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,8,power_law_1.01,0.05374079942703247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,8,power_law_1.01,0.05865600109100342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,8,power_law_1.01,0.0602944016456604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,8,power_law_1.01,0.049644801020622256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,8,power_law_1.01,0.054553598165512085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,8,power_law_1.01,0.056806397438049314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,8,power_law_1.01,0.060703998804092406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,8,power_law_1.01,0.07237120270729065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,8,power_law_1.01,0.08547840118408204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,8,power_law_1.01,0.09715200066566468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,8,power_law_1.01,0.11272319555282592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,8,power_law_1.01,0.14794880151748657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,8,power_law_1.01,0.16002559661865234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,8,power_law_1.01,0.20405759811401367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,8,power_law_1.01,0.258950400352478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,8,power_law_1.01,0.3894207954406738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,8,power_law_1.01,0.4924160003662109
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,8,power_law_1.01,0.6067008018493653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,2,power_law_1.2,0.05931519865989685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,8,power_law_1.01,0.9579263687133789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,2,power_law_1.2,0.0652671992778778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,2,power_law_1.2,0.06260480284690857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,8,power_law_1.01,1.867238426208496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,2,power_law_1.2,0.06874880194664001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,2,power_law_1.2,0.08103039860725403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,2,power_law_1.2,0.09454079866409301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,2,power_law_1.2,0.12015360593795776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,2,power_law_1.2,0.125273597240448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,2,power_law_1.2,0.1293503999710083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,2,power_law_1.2,0.1291391968727112
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,2,power_law_1.2,0.13672319650650025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,2,power_law_1.2,0.1416640043258667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,2,power_law_1.2,0.14534399509429932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,2,power_law_1.2,0.1572224020957947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,2,power_law_1.2,0.1654080033302307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,2,power_law_1.2,0.17400959730148316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,8,power_law_1.2,0.03612799942493439
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,8,power_law_1.2,0.033267199993133545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,2,power_law_1.2,0.19264639616012574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,8,power_law_1.2,0.033452799916267394
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,2,power_law_1.2,0.2278592109680176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,8,power_law_1.2,0.0344895988702774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,2,power_law_1.2,0.25941760540008546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,8,power_law_1.2,0.04186240136623383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,2,power_law_1.2,0.31040000915527344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,8,power_law_1.2,0.04636160135269165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,2,power_law_1.2,0.38209919929504393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,8,power_law_1.2,0.04759039878845215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,2,power_law_1.2,0.4871679782867432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,8,power_law_1.2,0.051283198595047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,2,power_law_1.2,0.5817728042602539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,8,power_law_1.2,0.05394560098648071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,2,power_law_1.2,0.7990592002868653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,8,power_law_1.2,0.05408639907836914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,2,power_law_1.2,1.0182016372680665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,8,power_law_1.2,0.05866879820823669
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,8,power_law_1.2,0.06316159963607788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,2,power_law_1.2,1.3976896286010743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,8,power_law_1.2,0.06581760048866273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,2,power_law_1.2,1.8603200912475586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,8,power_law_1.2,0.05006080269813538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,2,power_law_1.2,2.064499282836914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,8,power_law_1.2,0.05414400100708008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,8,power_law_1.2,0.0586624026298523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,2,power_law_1.2,3.3353023529052734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,8,power_law_1.2,0.06600959897041321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,8,power_law_1.2,0.07749760150909424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,2,power_law_1.2,6.528953552246094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,8,power_law_1.2,0.08528000116348267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,8,power_law_1.2,0.10780160427093506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,8,power_law_1.2,0.11845120191574096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,8,power_law_1.2,0.16391680240631104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,8,power_law_1.2,0.17968640327453614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,8,power_law_1.2,0.24113919734954833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,8,power_law_1.2,0.31547520160675047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,8,power_law_1.2,0.4653759956359863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,8,power_law_1.2,0.6230783939361573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,8,power_law_1.2,0.8293184280395508
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,8,power_law_1.2,1.4635775566101075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,8,power_law_1.2,2.721260833740234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,4,power_law_1.01,0.035769599676132205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,4,power_law_1.01,0.033523198962211606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,4,power_law_1.01,0.033529600501060484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,4,power_law_1.01,0.03475199937820435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,32,power_law_1.01,1.7316671371459962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,4,power_law_1.01,0.04049279987812042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,4,power_law_1.01,0.04499199986457825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,4,power_law_1.01,0.04622080028057098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,4,power_law_1.01,0.04826880097389221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,4,power_law_1.01,0.04848000109195709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,4,power_law_1.01,0.04867840111255646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,4,power_law_1.01,0.049497601389884946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,4,power_law_1.01,0.0515392005443573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,4,power_law_1.01,0.05195519924163818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,4,power_law_1.01,0.05605760216712952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,4,power_law_1.01,0.06444799900054932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,4,power_law_1.2,0.03611519932746887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,4,power_law_1.01,0.06587520241737366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,4,power_law_1.2,0.032025599479675294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,4,power_law_1.01,0.0759168028831482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,4,power_law_1.2,0.03283199965953827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,4,power_law_1.01,0.09392639994621277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,4,power_law_1.2,0.03426559865474701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,4,power_law_1.01,0.1023360013961792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,4,power_law_1.2,0.03837440013885498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,4,power_law_1.01,0.11912319660186768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,4,power_law_1.2,0.045952001214027406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,4,power_law_1.01,0.14124159812927245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,4,power_law_1.2,0.045952001214027406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,4,power_law_1.01,0.18343679904937743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,4,power_law_1.2,0.047167998552322385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,4,power_law_1.01,0.2282815933227539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,4,power_law_1.2,0.04792320132255554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,4,power_law_1.01,0.31674880981445314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,4,power_law_1.2,0.046982398629188536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,2,power_law_1.01,0.03715839982032776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,4,power_law_1.2,0.05006080269813538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,4,power_law_1.01,0.3642688035964966
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,2,power_law_1.01,0.03532159924507141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,4,power_law_1.2,0.0529151976108551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,2,power_law_1.01,0.03654400110244751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,4,power_law_1.01,0.48133120536804197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,4,power_law_1.2,0.05415679812431336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,2,power_law_1.01,0.041465601325035094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,4,power_law_1.01,0.6157631874084473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,4,power_law_1.2,0.06090880036354065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,2,power_law_1.01,0.044326400756835936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,4,power_law_1.01,0.7810239791870117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,2,power_law_1.01,0.05211520195007324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,4,power_law_1.2,0.06848639845848084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,4,power_law_1.01,1.1318528175354003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,2,power_law_1.01,0.05334399938583374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,4,power_law_1.2,0.06970239877700805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,2,power_law_1.01,0.0531391978263855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,4,power_law_1.2,0.07750399708747864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,4,power_law_1.01,2.386662483215332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,2,power_law_1.01,0.054771202802658084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,4,power_law_1.2,0.09018239974975586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,2,power_law_1.01,0.05457280278205871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,4,power_law_1.2,0.10084480047225952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,2,power_law_1.01,0.0578495979309082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,4,power_law_1.2,0.11824640035629272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,2,power_law_1.01,0.059494400024414064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,4,power_law_1.2,0.14672640562057496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,2,power_law_1.01,0.061945599317550656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,4,power_law_1.2,0.2113663911819458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,2,power_law_1.01,0.06644480228424073
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,4,power_law_1.2,0.23070080280303956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,2,power_law_1.01,0.07463679909706115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,4,power_law_1.2,0.317523193359375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,2,power_law_1.01,0.07913600206375122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,4,power_law_1.2,0.4231935977935791
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,2,power_law_1.01,0.09041280150413514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,4,power_law_1.2,0.6017727851867676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,2,power_law_1.01,0.10699520111083985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,4,power_law_1.2,0.6908544063568115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,2,power_law_1.01,0.12092800140380859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,4,power_law_1.2,0.9083647727966309
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,2,power_law_1.01,0.14713599681854247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,2,power_law_1.01,0.18256640434265137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,4,power_law_1.2,1.587071990966797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,2,power_law_1.01,0.2409280061721802
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,4,power_law_1.2,3.207449722290039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,2,power_law_1.01,0.3183552026748657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,16,power_law_1.2,0.055641597509384154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,2,power_law_1.01,0.42771201133728026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,16,power_law_1.2,0.05870720148086548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,2,power_law_1.01,0.5116672039031982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,16,power_law_1.2,0.05889279842376709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,2,power_law_1.01,0.6708159923553467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,2,power_law_1.2,0.035366401076316833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,16,power_law_1.2,0.04867199957370758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,2,power_law_1.01,0.9095871925354004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,2,power_law_1.2,0.033107200264930726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,16,power_law_1.2,0.05358719825744629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,2,power_law_1.2,0.03597440123558045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,2,power_law_1.01,1.1002623558044433
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,16,power_law_1.2,0.05480960011482239
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,2,power_law_1.2,0.03761920034885406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,2,power_law_1.01,1.7312511444091796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,16,power_law_1.2,0.06709759831428527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,2,power_law_1.2,0.04007039964199066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,16,power_law_1.2,0.0762943983078003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,2,power_law_1.2,0.0490880012512207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,2,power_law_1.01,3.463052749633789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,16,power_law_1.2,0.09003520011901855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,2,power_law_1.2,0.052179199457168576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,16,power_law_1.2,0.11338880062103271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,2,power_law_1.2,0.05317760109901428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,16,power_law_1.2,0.10559999942779541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,2,power_law_1.2,0.05380480289459229
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,16,power_law_1.2,0.1457535982131958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,2,power_law_1.2,0.0543936014175415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,16,power_law_1.2,0.16049920320510863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,2,power_law_1.2,0.05543680191040039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,2,power_law_1.2,0.06076800227165222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,16,power_law_1.2,0.22664320468902588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,2,power_law_1.2,0.06302080154418946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,16,power_law_1.2,0.3089792013168335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,2,power_law_1.2,0.06897280216217042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,16,power_law_1.2,0.38373761177062987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,32,power_law_1.01,0.08978559970855712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,2,power_law_1.2,0.0759168028831482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,16,power_law_1.2,0.649951982498169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,32,power_law_1.01,0.08978559970855712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,2,power_law_1.2,0.0818560004234314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,16,power_law_1.2,0.7318848133087158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,32,power_law_1.01,0.0639743983745575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,2,power_law_1.2,0.0896127998828888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,32,power_law_1.01,0.07257599830627441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,2,power_law_1.2,0.10705920457839965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,16,power_law_1.2,1.243673610687256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,32,power_law_1.01,0.07667840123176575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,2,power_law_1.2,0.1199295997619629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,16,power_law_1.2,2.3024959564208984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,32,power_law_1.01,0.08343039751052857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,2,power_law_1.2,0.1473855972290039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,32,power_law_1.01,0.08486400246620178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,2,power_law_1.2,0.18792959451675414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,32,power_law_1.01,0.08691200017929077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,2,power_law_1.2,0.24506878852844238
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,32,power_law_1.01,0.0863103985786438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,2,power_law_1.2,0.3214656114578247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,32,power_law_1.2,0.09184640049934387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,32,power_law_1.01,0.08856319785118102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,2,power_law_1.2,0.4408576011657715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,32,power_law_1.2,0.07259520292282104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,32,power_law_1.01,0.09080320000648498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,2,power_law_1.2,0.501043176651001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,32,power_law_1.2,0.07423359751701356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,32,power_law_1.01,0.08917120099067688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,32,power_law_1.2,0.06481279730796814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,2,power_law_1.2,0.7671103954315186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,32,power_law_1.01,0.09591680169105529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,32,power_law_1.2,0.07218559980392455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,2,power_law_1.2,0.9981311798095703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,32,power_law_1.01,0.10085120201110839
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,32,power_law_1.2,0.08283519744873047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,2,power_law_1.2,1.2760319709777832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,32,power_law_1.01,0.10718719959259033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,32,power_law_1.2,0.08447359800338745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,2,power_law_1.2,1.797248077392578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,32,power_law_1.01,0.11435519456863404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,32,power_law_1.2,0.08876799941062927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,32,power_law_1.01,0.12193919420242309
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,32,power_law_1.2,0.08979840278625488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,2,power_law_1.2,4.0127616882324215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,32,power_law_1.01,0.14446719884872436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,32,power_law_1.01,0.13299839496612548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,32,power_law_1.01,0.16514559984207153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,32,power_law_1.01,0.18234879970550538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,32,power_law_1.01,0.22926080226898193
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,16,power_law_1.01,0.08840320110321045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,32,power_law_1.01,0.25504000186920167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,16,power_law_1.01,0.08840320110321045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,32,power_law_1.01,0.3513024091720581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,16,power_law_1.01,0.056460797786712646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,32,power_law_1.01,0.4375296115875244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,16,power_law_1.01,0.06260480284690857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,32,power_law_1.01,0.6769343852996826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,16,power_law_1.01,0.06832640171051026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,16,power_law_1.01,0.08612480163574218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,32,power_law_1.01,0.8522432327270508
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,16,power_law_1.01,0.08369280099868774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,32,power_law_1.01,1.043942356109619
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,16,power_law_1.01,0.08799359798431397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,32,power_law_1.01,1.6354047775268554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,16,power_law_1.01,0.08880640268325805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,16,power_law_1.01,0.09168000221252441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,32,power_law_1.01,3.3495742797851564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,16,power_law_1.01,0.09082880020141601
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,16,power_law_1.01,0.09203839898109437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,16,power_law_1.01,0.09249280095100403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,16,power_law_1.2,0.08758400082588196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,16,power_law_1.01,0.09741439819335937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,16,power_law_1.2,0.06588159799575806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,16,power_law_1.01,0.10949120521545411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,16,power_law_1.2,0.056460797786712646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,16,power_law_1.01,0.11195520162582398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,16,power_law_1.2,0.06096000075340271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,16,power_law_1.2,0.06998400092124939
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,16,power_law_1.01,0.11214720010757447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,16,power_law_1.2,0.0822655975818634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,16,power_law_1.01,0.13181439638137818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,16,power_law_1.2,0.08594560027122497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,16,power_law_1.01,0.134278404712677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,16,power_law_1.2,0.08737919926643371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,16,power_law_1.01,0.15926400423049927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,16,power_law_1.2,0.09004799723625183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,16,power_law_1.01,0.171942400932312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,16,power_law_1.2,0.09066879749298096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,16,power_law_1.01,0.2301248073577881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,16,power_law_1.2,0.0920960009098053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,16,power_law_1.01,0.25141119956970215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,16,power_law_1.2,0.09291520118713378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,16,power_law_1.01,0.36202239990234375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,16,power_law_1.2,0.09455999732017517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,16,power_law_1.01,0.39927680492401124
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,16,power_law_1.2,0.10417920351028442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,16,power_law_1.01,0.6462719917297364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,16,power_law_1.2,0.11196160316467285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,16,power_law_1.01,0.7511231899261475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,16,power_law_1.2,0.11666560173034668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,8,power_law_1.01,0.07278079986572265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,16,power_law_1.01,0.9604415893554688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,16,power_law_1.2,0.11871360540390015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,8,power_law_1.01,0.077702397108078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,16,power_law_1.2,0.1363263964653015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,16,power_law_1.01,1.461580753326416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,8,power_law_1.01,0.05947520136833191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,16,power_law_1.2,0.14268159866333008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,8,power_law_1.01,0.06357120275497437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,16,power_law_1.01,2.9553855895996093
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,16,power_law_1.2,0.17360639572143555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,8,power_law_1.01,0.06930559873580933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,16,power_law_1.2,0.17932800054550171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,8,power_law_1.01,0.08363519906997681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,16,power_law_1.2,0.23464319705963135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,8,power_law_1.01,0.08609920144081115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,16,power_law_1.2,0.28562560081481936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,8,power_law_1.01,0.08917760252952575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,16,power_law_1.2,0.4066624164581299
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,8,power_law_1.01,0.09121919870376587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,16,power_law_1.2,0.501471996307373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,8,power_law_1.01,0.09218559861183166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,16,power_law_1.2,0.7867648124694824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,8,power_law_1.01,0.09593600034713745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,16,power_law_1.2,0.9661888122558594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,8,power_law_1.01,0.09470080137252808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,16,power_law_1.2,1.4460160255432128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,8,power_law_1.01,0.09757440090179444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,16,power_law_1.2,1.6643455505371094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,8,power_law_1.01,0.10247679948806762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,8,power_law_1.01,0.10944639444351197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,16,power_law_1.2,4.876627349853516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,8,power_law_1.01,0.1118399977684021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,8,power_law_1.01,0.1258239984512329
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,8,power_law_1.01,0.13422080278396606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,8,power_law_1.01,0.1538879990577698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,8,power_law_1.01,0.19478399753570558
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,8,power_law_1.01,0.19341440200805665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,8,power_law_1.01,0.24092159271240235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,8,power_law_1.2,0.06914560198783874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,8,power_law_1.2,0.059539198875427246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,8,power_law_1.01,0.28351359367370604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,8,power_law_1.2,0.05482239723205566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,8,power_law_1.01,0.3877824068069458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,8,power_law_1.2,0.05708799958229065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,8,power_law_1.01,0.48792319297790526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,8,power_law_1.2,0.06546559929847717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,8,power_law_1.01,0.658073616027832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,8,power_law_1.2,0.08265600204467774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,8,power_law_1.01,0.8479424476623535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,8,power_law_1.2,0.08389120101928711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,8,power_law_1.01,0.9902912139892578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,8,power_law_1.2,0.08716800212860107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,8,power_law_1.2,0.09045119881629944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,8,power_law_1.01,1.4822208404541015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,8,power_law_1.2,0.09086719751358033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,8,power_law_1.01,3.14847354888916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,8,power_law_1.2,0.09578239917755127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,8,power_law_1.2,0.09659519791603088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,8,power_law_1.2,0.09905920028686524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,8,power_law_1.2,0.10069119930267334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,4,power_law_1.01,0.055225598812103274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,8,power_law_1.2,0.11298559904098511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,4,power_law_1.01,0.05975040197372437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,8,power_law_1.2,0.12075519561767578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,4,power_law_1.01,0.05727360248565674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,8,power_law_1.2,0.12565759420394898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,4,power_law_1.01,0.06301440000534057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,8,power_law_1.2,0.14409600496292113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,4,power_law_1.01,0.07203199863433837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,8,power_law_1.2,0.150655996799469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,4,power_law_1.01,0.0904640018939972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,8,power_law_1.2,0.1881600022315979
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,4,power_law_1.01,0.09352959990501404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,4,power_law_1.01,0.0937279999256134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,8,power_law_1.2,0.21087999343872071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,4,power_law_1.01,0.09619200229644775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,8,power_law_1.2,0.26410880088806155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,4,power_law_1.01,0.09720960259437561
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,8,power_law_1.2,0.2995392084121704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,4,power_law_1.01,0.09905920028686524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,8,power_law_1.2,0.4025536060333252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,4,power_law_1.01,0.10622080564498901
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,8,power_law_1.2,0.519488000869751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,4,power_law_1.01,0.10438400506973267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,8,power_law_1.2,0.7597248077392578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,4,power_law_1.01,0.11256959438323974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,8,power_law_1.2,1.0071295738220214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,4,power_law_1.01,0.11849600076675415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,8,power_law_1.2,1.3696640014648438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,4,power_law_1.01,0.13100800514221192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,4,power_law_1.01,0.138374400138855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,8,power_law_1.2,2.123084831237793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,4,power_law_1.2,0.057843202352523805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,4,power_law_1.01,0.1572224020957947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,4,power_law_1.2,0.05578879714012146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,8,power_law_1.2,4.378534317016602
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,4,power_law_1.01,0.17933440208435059
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,4,power_law_1.2,0.05783039927482605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,4,power_law_1.01,0.2102720022201538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,4,power_law_1.2,0.063155198097229
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,4,power_law_1.01,0.24097280502319335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,4,power_law_1.2,0.06644480228424073
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,4,power_law_1.01,0.29361279010772706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,4,power_law_1.2,0.08733440041542054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,4,power_law_1.01,0.37431039810180666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,4,power_law_1.2,0.09224960207939148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,4,power_law_1.01,0.45971198081970216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,4,power_law_1.2,0.09511039853096008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,4,power_law_1.01,0.6231296062469482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,4,power_law_1.2,0.0977728009223938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,4,power_law_1.2,0.10002559423446655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,4,power_law_1.01,0.7891520023345947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,4,power_law_1.2,0.10330239534378052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,4,power_law_1.01,1.0958208084106444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,4,power_law_1.2,0.10698239803314209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,4,power_law_1.01,1.3333888053894043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,4,power_law_1.2,0.10739200115203858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,4,power_law_1.01,1.8951488494873048
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,4,power_law_1.2,0.11804800033569336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,4,power_law_1.2,0.12890880107879638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,4,power_law_1.01,4.126655960083008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,4,power_law_1.2,0.1348479986190796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,4,power_law_1.2,0.14384000301361083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,4,power_law_1.2,0.16270079612731933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,4,power_law_1.2,0.18353919982910155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,4,power_law_1.2,0.21553280353546142
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,4,power_law_1.2,0.24624640941619874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,4,power_law_1.2,0.3044095993041992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,4,power_law_1.2,0.40599679946899414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,4,power_law_1.2,0.5137279987335205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,4,power_law_1.2,0.6556479930877686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,4,power_law_1.2,0.8923968315124512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,4,power_law_1.2,1.2227328300476075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,32,power_law_1.2,0.08972160220146179
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,32,power_law_1.2,0.08936960101127625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,4,power_law_1.2,1.5985471725463867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,32,power_law_1.2,0.09327999949455261
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,2,power_law_1.01,0.05746560096740723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,4,power_law_1.2,2.527302360534668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,32,power_law_1.2,0.09799039959907532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,2,power_law_1.01,0.059724801778793336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,32,power_law_1.2,0.10412800312042236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,2,power_law_1.01,0.060153597593307497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,4,power_law_1.2,5.149772644042969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,32,power_law_1.2,0.11006079912185669
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,2,power_law_1.01,0.06628479957580566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,32,power_law_1.2,0.11313920021057129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,2,power_law_1.01,0.07775999903678894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,2,power_law_1.01,0.09863680005073547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,32,power_law_1.2,0.12789119482040406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,2,power_law_1.01,0.10131200551986694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,32,power_law_1.2,0.14629119634628296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,32,power_law_1.2,0.14261759519577027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,2,power_law_1.01,0.10601600408554077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,32,power_law_1.2,0.17210880517959595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,32,power_law_1.2,0.19792640209197998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,32,power_law_1.2,0.2587584018707275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,32,power_law_1.2,0.31096320152282714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,32,power_law_1.2,0.3900032043457031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,32,power_law_1.2,0.6658624172210693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,2,power_law_1.2,0.055225598812103274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,32,power_law_1.2,0.8661952018737793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,2,power_law_1.2,0.05236480236053467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,2,power_law_1.2,0.058713597059249875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,32,power_law_1.2,1.141983985900879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,2,power_law_1.2,0.06546559929847717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,32,power_law_1.2,1.4209919929504395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,2,power_law_1.2,0.07672960162162781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,32,power_law_1.2,2.3935808181762694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,2,power_law_1.2,0.09619200229644775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,2,power_law_1.2,0.10047999620437623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,32,power_law_1.2,6.46561279296875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,64,power_law_1.01,0.14036480188369752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,2,power_law_1.2,0.10807039737701415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,2,power_law_1.2,0.11052800416946411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,64,power_law_1.01,0.13423360586166383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,2,power_law_1.2,0.11523840427398682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,64,power_law_1.01,0.14056960344314576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,2,power_law_1.2,0.12037119865417481
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,64,power_law_1.01,0.0850816011428833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,2,power_law_1.2,0.1252671957015991
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,64,power_law_1.01,0.10104960203170776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,2,power_law_1.2,0.12936960458755492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,2,power_law_1.2,0.13468799591064454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,64,power_law_1.01,0.1102720022201538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,2,power_law_1.2,0.14328960180282593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,64,power_law_1.01,0.12030719518661499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,2,power_law_1.2,0.14943360090255736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,64,power_law_1.01,0.1289023995399475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,2,power_law_1.2,0.1615231990814209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,2,power_law_1.2,0.19489920139312744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,64,power_law_1.01,0.12951680421829223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,2,power_law_1.2,0.22848000526428222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,64,power_law_1.01,0.1217344045639038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,2,power_law_1.2,0.2854207992553711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,64,power_law_1.01,0.12930560111999512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,2,power_law_1.2,0.34418559074401855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,64,power_law_1.01,0.13605120182037353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,2,power_law_1.2,0.422438383102417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,64,power_law_1.01,0.14017280340194702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,2,power_law_1.2,0.5375423908233643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,2,power_law_1.2,0.6839680194854736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,64,power_law_1.01,0.1430400013923645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,64,power_law_1.2,0.194649600982666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,64,power_law_1.01,0.15079679489135742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,2,power_law_1.2,0.8785344123840332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,64,power_law_1.2,0.13526400327682495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,64,power_law_1.01,0.16433279514312743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,2,power_law_1.2,1.2256704330444337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,64,power_law_1.2,0.13608319759368898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,2,power_law_1.2,1.4660863876342773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,64,power_law_1.01,0.16105600595474243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,64,power_law_1.2,0.08238080143928528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,2,power_law_1.2,1.7747200012207032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,64,power_law_1.01,0.21021440029144287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,64,power_law_1.2,0.09307519793510437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,64,power_law_1.01,0.17866239547729493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,2,power_law_1.2,2.96563835144043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,64,power_law_1.2,0.10269440412521362
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,64,power_law_1.01,0.22209279537200927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,2,power_law_1.2,6.192044830322265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,64,power_law_1.2,0.10413440465927123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,64,power_law_1.01,0.25608320236206056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,64,power_law_1.2,0.1196671962738037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,64,power_law_1.01,0.3020927906036377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,64,power_law_1.2,0.11601279973983765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,64,power_law_1.01,0.3705663919448853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,64,power_law_1.2,0.12502399682998658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,64,power_law_1.01,0.48096637725830077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,64,power_law_1.2,0.13729920387268066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,64,power_law_1.01,0.5227327823638916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,64,power_law_1.2,0.13935999870300292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,64,power_law_1.01,0.734278392791748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,64,power_law_1.2,0.1324031949043274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,64,power_law_1.01,0.9927424430847168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,64,power_law_1.2,0.14958080053329467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,64,power_law_1.01,1.1866880416870118
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,64,power_law_1.2,0.1647487998008728
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,64,power_law_1.01,1.7894208908081055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,64,power_law_1.2,0.16843520402908324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,64,power_law_1.2,0.18420480489730834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,64,power_law_1.01,3.8030017852783202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,64,power_law_1.2,0.21144959926605225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,64,power_law_1.2,0.20161919593811034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,64,power_law_1.2,0.23170559406280516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,64,power_law_1.2,0.2853760004043579
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,32,power_law_1.01,0.11257599592208863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,64,power_law_1.2,0.36586880683898926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,32,power_law_1.01,0.1418496012687683
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,64,power_law_1.2,0.42195839881896974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,32,power_law_1.01,0.1355072021484375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,32,power_law_1.01,0.07366399765014649
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,64,power_law_1.2,0.5796800136566163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,32,power_law_1.01,0.08554239869117737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,64,power_law_1.2,0.6372288227081299
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,32,power_law_1.01,0.09947519898414611
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,64,power_law_1.2,0.9562751770019531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,32,power_law_1.01,0.10682239532470703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,64,power_law_1.2,1.319007968902588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,32,power_law_1.01,0.1193343997001648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,64,power_law_1.2,1.7640192031860351
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,32,power_law_1.01,0.11585919857025147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,64,power_law_1.2,2.634822463989258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,32,power_law_1.01,0.11340160369873047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,32,power_law_1.01,0.1224128007888794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,64,power_law_1.2,4.918700790405273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,32,power_law_1.01,0.13141759634017944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,32,power_law_1.2,0.11190400123596192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,32,power_law_1.01,0.13301759958267212
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,32,power_law_1.2,0.14466559886932373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,32,power_law_1.01,0.13980159759521485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,32,power_law_1.2,0.11312639713287354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,32,power_law_1.01,0.15148160457611085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,32,power_law_1.2,0.07788159847259521
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,32,power_law_1.01,0.14594559669494628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,32,power_law_1.2,0.09183359742164612
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,32,power_law_1.01,0.1602944016456604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,32,power_law_1.2,0.09306880235671997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,32,power_law_1.01,0.17749760150909424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,32,power_law_1.2,0.09941120147705078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,32,power_law_1.01,0.17564799785614013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,32,power_law_1.2,0.11415679454803467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,32,power_law_1.01,0.20126080513000488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,32,power_law_1.2,0.11763199567794799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,32,power_law_1.01,0.23525760173797608
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,32,power_law_1.2,0.11681920289993286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,32,power_law_1.01,0.2899391889572144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,32,power_law_1.2,0.12561919689178466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,32,power_law_1.01,0.3382591962814331
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,32,power_law_1.2,0.1270591974258423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,32,power_law_1.01,0.4222400188446045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,32,power_law_1.2,0.13443200588226317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,32,power_law_1.01,0.5166528224945068
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,32,power_law_1.2,0.14158719778060913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,32,power_law_1.01,0.7150976181030273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,16,power_law_1.01,0.09838719964027405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,32,power_law_1.2,0.15471359491348266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,16,power_law_1.01,0.11560319662094116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,32,power_law_1.01,0.8496383666992188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,32,power_law_1.2,0.15696640014648439
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,16,power_law_1.01,0.14079359769821168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,32,power_law_1.2,0.1606528043746948
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,32,power_law_1.01,1.0831232070922852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,16,power_law_1.01,0.06972799897193908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,32,power_law_1.2,0.20529279708862305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,32,power_law_1.01,1.6637311935424806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,16,power_law_1.01,0.07914239764213563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,32,power_law_1.2,0.18439680337905884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,32,power_law_1.01,3.130912017822266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,16,power_law_1.01,0.0949184000492096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,32,power_law_1.2,0.2222912073135376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,16,power_law_1.01,0.10145280361175538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,32,power_law_1.2,0.26182401180267334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,16,power_law_1.01,0.11682560443878173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,32,power_law_1.2,0.3293951988220215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,16,power_law_1.01,0.11989760398864746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,32,power_law_1.2,0.35827839374542236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,16,power_law_1.01,0.12419840097427368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,32,power_law_1.2,0.48504958152770994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,16,power_law_1.01,0.1254271984100342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,32,power_law_1.2,0.5608191967010498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,16,power_law_1.01,0.12952959537506104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,32,power_law_1.2,0.8346303939819336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,16,power_law_1.01,0.1336192011833191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,32,power_law_1.2,1.0222399711608887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,16,power_law_1.01,0.13895039558410643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,32,power_law_1.2,1.405395221710205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,16,power_law_1.01,0.1512511968612671
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,16,power_law_1.01,0.16106879711151123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,32,power_law_1.2,2.193484878540039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,16,power_law_1.01,0.1635200023651123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,16,power_law_1.01,0.1835968017578125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,32,power_law_1.2,4.310092926025391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,16,power_law_1.01,0.1778496026992798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,16,power_law_1.01,0.2052992105484009
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,16,power_law_1.01,0.22346880435943603
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,16,power_law_1.2,0.0937279999256134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,16,power_law_1.01,0.27779839038848875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,16,power_law_1.2,0.11503360271453858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,2,power_law_1.01,0.10970239639282227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,16,power_law_1.01,0.3343168020248413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,16,power_law_1.2,0.09598720073699951
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,2,power_law_1.01,0.11113599538803101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,16,power_law_1.2,0.0646399974822998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,16,power_law_1.01,0.4254464149475098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,2,power_law_1.01,0.11421439647674561
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,16,power_law_1.2,0.08204159736633301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,16,power_law_1.01,0.5026495933532715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,2,power_law_1.01,0.11850880384445191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,16,power_law_1.2,0.08943359851837158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,16,power_law_1.01,0.7142144203186035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,2,power_law_1.01,0.12547199726104735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,16,power_law_1.2,0.09249920248985291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,2,power_law_1.01,0.13304320573806763
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,16,power_law_1.01,0.8694592475891113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,16,power_law_1.2,0.11667200326919555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,2,power_law_1.01,0.14287359714508058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,16,power_law_1.01,1.0736191749572754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,2,power_law_1.01,0.14819200038909913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,16,power_law_1.2,0.11400320529937744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,16,power_law_1.01,1.6542463302612305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,2,power_law_1.01,0.1592512011528015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,16,power_law_1.2,0.11503360271453858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,2,power_law_1.01,0.1928447961807251
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,16,power_law_1.2,0.1217919945716858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,16,power_law_1.01,3.251667022705078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,2,power_law_1.01,0.2178112030029297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,16,power_law_1.2,0.13468799591064454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,2,power_law_1.01,0.26698880195617675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,16,power_law_1.2,0.1303936004638672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,2,power_law_1.01,0.3278143882751465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,16,power_law_1.2,0.13999999761581422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,2,power_law_1.01,0.4193408012390137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,8,power_law_1.01,0.06438400149345398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,16,power_law_1.2,0.15271040201187133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,2,power_law_1.01,0.5215551853179932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,8,power_law_1.01,0.08937600255012512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,16,power_law_1.2,0.15475840568542482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,2,power_law_1.01,0.674124813079834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,8,power_law_1.01,0.11864320039749146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,16,power_law_1.2,0.1576192021369934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,2,power_law_1.01,0.8568063735961914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,8,power_law_1.01,0.06500480175018311
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,16,power_law_1.2,0.189792001247406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,2,power_law_1.01,1.1658111572265626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,8,power_law_1.01,0.0803391993045807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,16,power_law_1.2,0.17934080362319946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,2,power_law_1.01,1.4628416061401368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,8,power_law_1.01,0.091839998960495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,16,power_law_1.2,0.21127679347991943
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,2,power_law_1.01,1.7255615234375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,8,power_law_1.01,0.10084480047225952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,16,power_law_1.2,0.23607680797576905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,2,power_law_1.01,2.744825553894043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,8,power_law_1.01,0.11353600025177002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,16,power_law_1.2,0.2923775911331177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,2,power_law_1.01,5.662847900390625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,8,power_law_1.01,0.11968640089035035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,16,power_law_1.2,0.33948800563812254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,8,power_law_1.01,0.12276480197906495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,16,power_law_1.2,0.47479681968688964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,8,power_law_1.01,0.12665599584579468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,16,power_law_1.2,0.5174208164215088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,8,power_law_1.01,0.13422720432281493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,16,power_law_1.2,0.7667007923126221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,8,power_law_1.01,0.13564800024032592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,8,power_law_1.2,0.06555520296096802
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,16,power_law_1.2,1.0394432067871093
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,8,power_law_1.2,0.08815360069274902
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,8,power_law_1.01,0.13955199718475342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,16,power_law_1.2,1.3538623809814454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,8,power_law_1.2,0.07832959890365601
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,8,power_law_1.01,0.15265920162200927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,16,power_law_1.2,1.9662208557128906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,8,power_law_1.2,0.06727039813995361
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,8,power_law_1.01,0.158406400680542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,16,power_law_1.2,3.8085887908935545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,8,power_law_1.2,0.07893760204315185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,8,power_law_1.01,0.17189760208129884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,8,power_law_1.2,0.09512320160865784
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,8,power_law_1.01,0.18686720132827758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,8,power_law_1.2,0.09552000164985656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,8,power_law_1.01,0.19259519577026368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,8,power_law_1.2,0.1123263955116272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,8,power_law_1.01,0.24318079948425292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,8,power_law_1.2,0.11251840591430665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,8,power_law_1.01,0.2554624080657959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,8,power_law_1.2,0.1192896008491516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,8,power_law_1.01,0.3058495998382568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,8,power_law_1.2,0.12788480520248413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,8,power_law_1.01,0.3529664039611816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,8,power_law_1.2,0.1346560001373291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,8,power_law_1.01,0.46129279136657714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,8,power_law_1.2,0.14099839925765992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,8,power_law_1.01,0.58089599609375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,8,power_law_1.2,0.14467840194702147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,8,power_law_1.01,0.8125184059143067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,8,power_law_1.2,0.16085760593414306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,4,power_law_1.01,0.061363202333450315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,8,power_law_1.01,0.9988863945007325
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,8,power_law_1.2,0.1579967975616455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,4,power_law_1.01,0.06587520241737366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,8,power_law_1.01,1.1444992065429687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,8,power_law_1.2,0.16966400146484376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,4,power_law_1.01,0.09004799723625183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,8,power_law_1.2,0.18542720079421998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,8,power_law_1.01,1.7214336395263672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,4,power_law_1.01,0.0630016028881073
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,8,power_law_1.2,0.20487680435180664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,4,power_law_1.01,0.08021759986877441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,8,power_law_1.01,3.4753345489501952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,8,power_law_1.2,0.2460416078567505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,4,power_law_1.01,0.09987199902534485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,8,power_law_1.2,0.2716736078262329
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,4,power_law_1.01,0.10765440464019775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,4,power_law_1.01,0.12178560495376586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,8,power_law_1.2,0.3329087972640991
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,4,power_law_1.01,0.12814079523086547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,8,power_law_1.2,0.3931071996688843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,4,power_law_1.2,0.06096000075340271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,4,power_law_1.01,0.13100160360336305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,8,power_law_1.2,0.5010303974151611
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,4,power_law_1.01,0.1312064051628113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,4,power_law_1.2,0.06629120111465454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,8,power_law_1.2,0.6863743782043457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,4,power_law_1.01,0.14124159812927245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,4,power_law_1.2,0.07201279997825623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,8,power_law_1.2,0.8379327774047851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,4,power_law_1.2,0.0664896011352539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,4,power_law_1.01,0.14451199769973755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,8,power_law_1.2,1.076095962524414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,4,power_law_1.01,0.15312000513076782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,4,power_law_1.2,0.07530239820480347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,8,power_law_1.2,1.3701888084411622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,4,power_law_1.01,0.16743680238723754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,4,power_law_1.2,0.09434239864349366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,8,power_law_1.2,1.9333887100219727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,4,power_law_1.01,0.16828160285949706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,4,power_law_1.2,0.09783040285110474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,4,power_law_1.01,0.1848703980445862
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,4,power_law_1.2,0.11708159446716308
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,8,power_law_1.2,3.765740966796875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,4,power_law_1.01,0.20616960525512695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,4,power_law_1.2,0.12302080392837525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,4,power_law_1.01,0.21986560821533202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,4,power_law_1.2,0.1269055962562561
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,4,power_law_1.01,0.267193603515625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,4,power_law_1.2,0.136735999584198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,4,power_law_1.01,0.30157439708709716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,4,power_law_1.2,0.1432960033416748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,4,power_law_1.01,0.3908799886703491
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,4,power_law_1.2,0.14739199876785278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,4,power_law_1.2,0.1543552041053772
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,4,power_law_1.01,0.45226240158081055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,4,power_law_1.2,0.16458879709243773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,4,power_law_1.01,0.6067584037780762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,4,power_law_1.2,0.17073919773101806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,4,power_law_1.01,0.7617856025695801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,4,power_law_1.2,0.19039360284805298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,4,power_law_1.01,1.0313023567199706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,4,power_law_1.2,0.21128320693969727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,4,power_law_1.01,1.3063424110412598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,4,power_law_1.2,0.22685439586639405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,4,power_law_1.01,1.660857582092285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,4,power_law_1.2,0.27538559436798093
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,4,power_law_1.01,2.271353530883789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,4,power_law_1.2,0.31693439483642577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,2,power_law_1.01,0.06355839967727661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,4,power_law_1.2,0.3998975992202759
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,4,power_law_1.01,4.3658496856689455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,2,power_law_1.01,0.06500480175018311
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,4,power_law_1.2,0.4797760009765625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,2,power_law_1.01,0.07339519858360291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,4,power_law_1.2,0.6104447841644287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,2,power_law_1.01,0.07442560195922851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,4,power_law_1.2,0.7740928173065186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,2,power_law_1.01,0.088755202293396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,4,power_law_1.2,1.0859904289245605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,2,power_law_1.01,0.11253119707107544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,4,power_law_1.2,1.328371238708496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,2,power_law_1.01,0.11866879463195801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,4,power_law_1.2,1.634227180480957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,8,power_law_1.01,0.033107200264930726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,2,power_law_1.01,0.14057600498199463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,8,power_law_1.01,0.033504000306129454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,4,power_law_1.2,2.5312576293945312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,8,power_law_1.01,0.034745600819587705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,2,power_law_1.01,0.14958720207214354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,8,power_law_1.01,0.03433600068092346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,2,power_law_1.01,0.15777920484542846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,8,power_law_1.01,0.03432320058345795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,4,power_law_1.2,5.2186431884765625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,8,power_law_1.01,0.035769599676132205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,2,power_law_1.01,0.16270079612731933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,8,power_law_1.01,0.03678080141544342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,8,power_law_1.01,0.03617919981479645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,2,power_law_1.01,0.17047040462493895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,2,power_law_1.2,0.06398079991340637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,8,power_law_1.01,0.03761920034885406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,2,power_law_1.01,0.17744640111923218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,2,power_law_1.2,0.06583679914474487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,8,power_law_1.01,0.038022398948669434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,8,power_law_1.01,0.036595198512077334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,2,power_law_1.2,0.07136639952659607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,2,power_law_1.01,0.18624000549316405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,8,power_law_1.01,0.040268799662590025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,2,power_law_1.2,0.07218559980392455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,2,power_law_1.01,0.1966912031173706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,8,power_law_1.01,0.04026240110397339
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,2,power_law_1.01,0.20897281169891357
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,8,power_law_1.2,0.034745600819587705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,8,power_law_1.01,0.0416703999042511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,2,power_law_1.2,0.08652160167694092
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,8,power_law_1.01,0.04826880097389221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,8,power_law_1.2,0.033529600501060484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,2,power_law_1.01,0.2228991985321045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,2,power_law_1.2,0.10350079536437988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,8,power_law_1.01,0.04989440143108368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,8,power_law_1.2,0.03353599905967712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,2,power_law_1.2,0.11437439918518066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,2,power_law_1.01,0.251366400718689
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,8,power_law_1.01,0.05318400263786316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,8,power_law_1.2,0.0343423992395401
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,8,power_law_1.2,0.033932799100875856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,8,power_law_1.01,0.05809280276298523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,2,power_law_1.2,0.14140160083770753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,2,power_law_1.01,0.2851583957672119
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,8,power_law_1.2,0.03454720079898834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,8,power_law_1.01,0.0642304003238678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,2,power_law_1.2,0.14304640293121337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,8,power_law_1.2,0.03495680093765259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,8,power_law_1.01,0.0822655975818634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,2,power_law_1.01,0.3531455993652344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,8,power_law_1.2,0.03475840091705322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,8,power_law_1.01,0.10028799772262573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,2,power_law_1.2,0.1524672031402588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,2,power_law_1.01,0.4014848232269287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,8,power_law_1.2,0.036595198512077334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,8,power_law_1.01,0.14471039772033692
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,2,power_law_1.2,0.1631168007850647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,8,power_law_1.2,0.035776001214981076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,8,power_law_1.01,0.16949119567871093
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,2,power_law_1.01,0.5210879802703857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,8,power_law_1.2,0.0367935985326767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,8,power_law_1.01,0.23299200534820558
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,2,power_law_1.2,0.17211519479751586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,2,power_law_1.01,0.6548160076141357
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,8,power_law_1.2,0.038431999087333676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,8,power_law_1.01,0.27803521156311034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,2,power_law_1.2,0.17354880571365355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,8,power_law_1.2,0.04173440039157868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,8,power_law_1.01,0.41483521461486816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,2,power_law_1.01,0.8559295654296875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,8,power_law_1.2,0.04273920059204102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,8,power_law_1.01,0.5850304126739502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,2,power_law_1.2,0.1856063961982727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,2,power_law_1.01,1.0933055877685547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,8,power_law_1.2,0.047251200675964354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,8,power_law_1.01,0.7105792045593262
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,2,power_law_1.2,0.20407679080963134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,8,power_law_1.2,0.050310397148132326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,2,power_law_1.01,1.5494015693664551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,8,power_law_1.01,1.0818752288818358
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,8,power_law_1.2,0.052153599262237546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,2,power_law_1.2,0.21063039302825928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,8,power_law_1.01,2.178387260437012
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,8,power_law_1.2,0.0611840009689331
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,2,power_law_1.01,1.8074304580688476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,2,power_law_1.2,0.23293440341949462
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,8,power_law_1.2,0.070796799659729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,2,power_law_1.01,2.183238410949707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,2,power_law_1.2,0.2732928037643433
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,8,power_law_1.2,0.08678399920463561
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,8,power_law_1.2,0.10398080348968505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,2,power_law_1.2,0.29419519901275637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,2,power_law_1.01,3.474099349975586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,8,power_law_1.2,0.14391039609909057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,2,power_law_1.2,0.3601279973983765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,8,power_law_1.2,0.16785279512405396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,8,power_law_1.2,0.24160640239715575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,2,power_law_1.2,0.41235837936401365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,8,power_law_1.2,0.2710720062255859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,2,power_law_1.2,0.5260223865509033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,8,power_law_1.2,0.41036162376403806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,4,power_law_1.01,0.03760640025138855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,8,power_law_1.2,0.5789055824279785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,2,power_law_1.2,0.6671232223510742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,4,power_law_1.01,0.03555839955806732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,8,power_law_1.2,0.7118015766143799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,4,power_law_1.01,0.03351680040359497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,2,power_law_1.2,0.8956671714782715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,8,power_law_1.2,1.12161283493042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,4,power_law_1.01,0.03392640054225922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,2,power_law_1.2,1.1215744018554688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,4,power_law_1.01,0.03372159898281098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,8,power_law_1.2,2.341542434692383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,4,power_law_1.01,0.03596799969673157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,2,power_law_1.2,1.5588095664978028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,4,power_law_1.01,0.035980799794197084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,4,power_law_1.01,0.034745600819587705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,2,power_law_1.2,1.8981632232666015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,4,power_law_1.01,0.03678080141544342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,4,power_law_1.01,0.03699840009212494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,2,power_law_1.2,2.2704896926879883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,4,power_law_1.01,0.0380160003900528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,4,power_law_1.01,0.038848000764846805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,2,power_law_1.2,3.5085121154785157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,4,power_law_1.01,0.03925119936466217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,4,power_law_1.01,0.04048640131950378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,2,power_law_1.2,6.623104095458984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,4,power_law_1.2,0.035571199655532834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,4,power_law_1.01,0.04620800018310547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,4,power_law_1.2,0.0367935985326767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,4,power_law_1.01,0.04907520115375519
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,4,power_law_1.2,0.033939200639724734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,4,power_law_1.01,0.05111039876937866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,4,power_law_1.2,0.0343423992395401
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,4,power_law_1.01,0.058911997079849246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,4,power_law_1.2,0.03496319949626923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,4,power_law_1.01,0.0664896011352539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,4,power_law_1.2,0.035776001214981076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,4,power_law_1.01,0.08757759928703308
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,4,power_law_1.2,0.03597440123558045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,4,power_law_1.01,0.09412479996681214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,4,power_law_1.2,0.03537279963493347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,4,power_law_1.01,0.12895359992980956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,4,power_law_1.2,0.03597440123558045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,4,power_law_1.01,0.16766719818115233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,4,power_law_1.2,0.03720319867134094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,4,power_law_1.01,0.2166208028793335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,2,power_law_1.01,0.03346560001373291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,4,power_law_1.2,0.038431999087333676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,4,power_law_1.01,0.3403072118759155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,2,power_law_1.01,0.03368319869041443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,4,power_law_1.2,0.03946239948272705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,4,power_law_1.01,0.3611776113510132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,2,power_law_1.01,0.03451519906520843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,4,power_law_1.2,0.041715198755264284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,4,power_law_1.01,0.5465472221374512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,2,power_law_1.01,0.03532159924507141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,4,power_law_1.2,0.04170239865779877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,4,power_law_1.01,0.7765247821807861
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,2,power_law_1.01,0.036345601081848145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,4,power_law_1.2,0.048256000876426695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,4,power_law_1.01,1.0773759841918946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,2,power_law_1.01,0.038387200236320494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,4,power_law_1.2,0.04990079998970032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,4,power_law_1.01,2.1161279678344727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,2,power_law_1.01,0.0385919988155365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,4,power_law_1.2,0.05358719825744629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,2,power_law_1.01,0.037785598635673524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,4,power_law_1.2,0.061363202333450315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,2,power_law_1.01,0.038796800374984744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,4,power_law_1.2,0.07182719707489013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,2,power_law_1.01,0.039827200770378116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,4,power_law_1.2,0.09537280201911927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,2,power_law_1.01,0.03961600065231323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,4,power_law_1.2,0.10561920404434204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,2,power_law_1.01,0.04002560079097748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,4,power_law_1.2,0.13305599689483644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,2,power_law_1.01,0.04166400134563446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,4,power_law_1.2,0.1865023970603943
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,2,power_law_1.01,0.043507200479507444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,4,power_law_1.2,0.2583807945251465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,2,power_law_1.01,0.04963200092315674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,4,power_law_1.2,0.2960639953613281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,2,power_law_1.01,0.050271999835968015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,4,power_law_1.2,0.44291839599609373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,2,power_law_1.2,0.0322816014289856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,2,power_law_1.01,0.05211520195007324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,4,power_law_1.2,0.5268735885620117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,2,power_law_1.2,0.03331199884414673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,2,power_law_1.01,0.058873599767684935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,4,power_law_1.2,0.6999296188354492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,2,power_law_1.2,0.03433600068092346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,2,power_law_1.01,0.06603519916534424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,4,power_law_1.2,1.1879743576049804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,2,power_law_1.2,0.03433600068092346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,2,power_law_1.01,0.0850495994091034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,2,power_law_1.2,0.0343423992395401
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,4,power_law_1.2,2.3678207397460938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,2,power_law_1.01,0.09798399806022644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,2,power_law_1.2,0.03617919981479645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,2,power_law_1.01,0.13381760120391845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,2,power_law_1.2,0.037196800112724304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,2,power_law_1.01,0.1628991961479187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,2,power_law_1.2,0.036364799737930296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,2,power_law_1.01,0.20508160591125488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,2,power_law_1.2,0.03823359906673431
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,2,power_law_1.01,0.2851648092269897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,2,power_law_1.2,0.03678719997406006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,2,power_law_1.01,0.37260799407958983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,2,power_law_1.2,0.0380160003900528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,2,power_law_1.01,0.5149568080902099
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,2,power_law_1.2,0.03882879912853241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,2,power_law_1.01,0.6062655925750733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,2,power_law_1.2,0.040889599919319154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,2,power_law_1.01,0.9620223999023437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,2,power_law_1.2,0.04191359877586365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,2,power_law_1.01,1.7898239135742187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,2,power_law_1.2,0.04867199957370758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,8,power_law_1.01,0.03842560052871704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,2,power_law_1.2,0.051744002103805545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,8,power_law_1.01,0.03658879995346069
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,2,power_law_1.2,0.05338240265846252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,8,power_law_1.01,0.03555839955806732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,2,power_law_1.2,0.06095359921455383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,8,power_law_1.01,0.03700479865074158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,2,power_law_1.2,0.07052800059318542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,8,power_law_1.01,0.03637759983539581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,2,power_law_1.2,0.08881919980049133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,8,power_law_1.01,0.036800000071525577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,2,power_law_1.2,0.10643199682235718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,8,power_law_1.01,0.038022398948669434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,2,power_law_1.2,0.1297727942466736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,8,power_law_1.01,0.03802880048751831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,2,power_law_1.2,0.1662335991859436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,8,power_law_1.01,0.03844479918479919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,2,power_law_1.2,0.2182528018951416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,8,power_law_1.01,0.041305598616600034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,2,power_law_1.2,0.296889591217041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,8,power_law_1.2,0.03900800049304962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,8,power_law_1.01,0.041715198755264284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,2,power_law_1.2,0.409932804107666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,8,power_law_1.2,0.03818239867687225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,8,power_law_1.01,0.04745599925518036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,2,power_law_1.2,0.551852798461914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,8,power_law_1.2,0.037785598635673524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,8,power_law_1.01,0.047219198942184445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,2,power_law_1.2,0.7212287902832031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,8,power_law_1.2,0.03777920007705689
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,8,power_law_1.01,0.048467200994491574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,2,power_law_1.2,1.0427776336669923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,8,power_law_1.2,0.03818239867687225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,8,power_law_1.01,0.05768960118293762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,8,power_law_1.2,0.03777279853820801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,8,power_law_1.01,0.05994880199432373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,2,power_law_1.2,2.1538047790527344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,8,power_law_1.2,0.03818239867687225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,8,power_law_1.01,0.06462720036506653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,8,power_law_1.2,0.03900800049304962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,8,power_law_1.01,0.07570559978485107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,8,power_law_1.2,0.04084480106830597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,8,power_law_1.01,0.0925055980682373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,8,power_law_1.2,0.04023680090904236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,8,power_law_1.01,0.1178879976272583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,8,power_law_1.2,0.04145280122756958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,8,power_law_1.01,0.13961600065231322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,8,power_law_1.2,0.04596480131149292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,8,power_law_1.01,0.1914240002632141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,8,power_law_1.2,0.047193598747253415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,8,power_law_1.01,0.24036478996276855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,8,power_law_1.2,0.04924800097942352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,8,power_law_1.01,0.33128321170806885
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,8,power_law_1.2,0.05804799795150757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,8,power_law_1.01,0.43923201560974123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,8,power_law_1.2,0.061536002159118655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,8,power_law_1.01,0.6659264087677002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,4,power_law_1.01,0.03922559916973114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,8,power_law_1.2,0.06316800117492676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,8,power_law_1.01,0.8150272369384766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,4,power_law_1.01,0.0367935985326767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,8,power_law_1.2,0.0787392020225525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,8,power_law_1.01,1.0937664031982421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,4,power_law_1.01,0.03637759983539581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,8,power_law_1.2,0.09246079921722412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,8,power_law_1.01,1.7083648681640624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,4,power_law_1.01,0.03678719997406006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,8,power_law_1.2,0.11868799924850464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,4,power_law_1.01,0.038227200508117676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,8,power_law_1.2,0.15164159536361693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,8,power_law_1.01,3.614432144165039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,4,power_law_1.01,0.03781760036945343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,8,power_law_1.2,0.2091775894165039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,4,power_law_1.01,0.03781760036945343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,8,power_law_1.2,0.2364351987838745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,4,power_law_1.01,0.03864319920539856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,8,power_law_1.2,0.33514881134033203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,4,power_law_1.01,0.03882879912853241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,8,power_law_1.2,0.4211584091186523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,4,power_law_1.01,0.03964160084724426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,8,power_law_1.2,0.6164991855621338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,4,power_law_1.01,0.040889599919319154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,8,power_law_1.2,0.8067904472351074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,4,power_law_1.01,0.04190720021724701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,8,power_law_1.2,1.110912036895752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,4,power_law_1.01,0.04497919976711273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,8,power_law_1.2,1.6628480911254884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,4,power_law_1.01,0.04826880097389221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,4,power_law_1.01,0.05480960011482239
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,8,power_law_1.2,3.4495105743408203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,4,power_law_1.01,0.057068800926208495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,4,power_law_1.2,0.04172160029411316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,4,power_law_1.01,0.06178560256958008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,4,power_law_1.2,0.03782399892807007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,4,power_law_1.01,0.0756991982460022
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,4,power_law_1.2,0.03596799969673157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,4,power_law_1.01,0.08144000172615051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,4,power_law_1.2,0.03678719997406006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,4,power_law_1.01,0.11626240015029907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,4,power_law_1.2,0.037196800112724304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,4,power_law_1.01,0.13059200048446656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,4,power_law_1.2,0.03802880048751831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,4,power_law_1.01,0.17319040298461913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,4,power_law_1.2,0.03863680064678192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,4,power_law_1.01,0.22193920612335205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,4,power_law_1.2,0.03904640078544617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,4,power_law_1.01,0.3583231925964355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,4,power_law_1.2,0.040275201201438904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,4,power_law_1.2,0.04090240001678467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,4,power_law_1.01,0.4171008110046387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,4,power_law_1.2,0.04089600145816803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,4,power_law_1.01,0.5903615951538086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,2,power_law_1.01,0.03654400110244751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,4,power_law_1.2,0.043961599469184875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,4,power_law_1.01,0.7986368179321289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,2,power_law_1.01,0.037363201379776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,4,power_law_1.2,0.04519039988517761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,4,power_law_1.01,0.9670016288757324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,2,power_law_1.01,0.036934399604797365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,4,power_law_1.2,0.04928640127182007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,4,power_law_1.01,1.3079808235168457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,2,power_law_1.01,0.03858560025691986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,4,power_law_1.2,0.056460797786712646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,4,power_law_1.01,3.6238590240478517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,2,power_law_1.01,0.039417600631713866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,4,power_law_1.2,0.05727360248565674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,2,power_law_1.01,0.04105600118637085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,4,power_law_1.2,0.06220160126686096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,2,power_law_1.01,0.0416703999042511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,4,power_law_1.2,0.07243520021438599
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,2,power_law_1.01,0.04351359903812409
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,4,power_law_1.2,0.08904320001602173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,2,power_law_1.01,0.04392319917678833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,4,power_law_1.2,0.11582720279693604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,2,power_law_1.01,0.04431360065937042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,4,power_law_1.2,0.1359231948852539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,2,power_law_1.01,0.04514560103416443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,4,power_law_1.2,0.17153279781341552
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,2,power_law_1.01,0.04555520117282867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,4,power_law_1.2,0.23503999710083007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,2,power_law_1.01,0.047200000286102294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,4,power_law_1.2,0.3104192018508911
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,2,power_law_1.01,0.047814399003982544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,4,power_law_1.2,0.42899198532104493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,2,power_law_1.01,0.05373439788818359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,4,power_law_1.2,0.5625279903411865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,2,power_law_1.01,0.05639680027961731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,4,power_law_1.2,0.8461631774902344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,2,power_law_1.2,0.0347135990858078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,2,power_law_1.01,0.06276479959487916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,2,power_law_1.2,0.03454079926013946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,4,power_law_1.2,1.1511039733886719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,2,power_law_1.01,0.07708160281181335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,2,power_law_1.2,0.03555839955806732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,4,power_law_1.2,1.6678207397460938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,2,power_law_1.01,0.08814719915390015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,2,power_law_1.2,0.03720319867134094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,2,power_law_1.01,6.734540557861328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,2,power_law_1.01,0.11272959709167481
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,4,power_law_1.2,3.4393535614013673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,2,power_law_1.2,0.03842560052871704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,2,power_law_1.01,0.12789119482040406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,2,power_law_1.2,0.039654400944709775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,2,power_law_1.01,0.17620480060577393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,2,power_law_1.2,0.04129279851913452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,2,power_law_1.01,0.21511681079864503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,2,power_law_1.2,0.04149119853973389
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,2,power_law_1.01,0.28558080196380614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,2,power_law_1.2,0.042931199073791504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,2,power_law_1.01,0.3646143913269043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,2,power_law_1.2,0.04129279851913452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,2,power_law_1.01,0.5686016082763672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,2,power_law_1.2,0.0427264004945755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,2,power_law_1.2,0.043756800889968875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,2,power_law_1.01,0.734668779373169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,2,power_law_1.2,0.04498560130596161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,2,power_law_1.01,0.8567616462707519
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,2,power_law_1.2,0.04702720046043396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,2,power_law_1.01,1.2571392059326172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,2,power_law_1.2,0.05441280007362366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,64,power_law_1.2,0.11912319660186768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,2,power_law_1.01,2.809113693237305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,2,power_law_1.2,0.059513598680496216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,64,power_law_1.2,0.09312639832496643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,2,power_law_1.2,0.05971199870109558
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,64,power_law_1.2,0.0605567991733551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,2,power_law_1.2,0.08143360018730164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,2,power_law_1.2,0.09290879964828491
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,64,power_law_1.2,0.0738752007484436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,2,power_law_1.2,0.1162559986114502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,64,power_law_1.2,0.06710399985313416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,2,power_law_1.2,0.13427200317382812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,64,power_law_1.2,0.0746944010257721
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,2,power_law_1.2,0.1781056046485901
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,2,power_law_1.2,0.2239680051803589
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,64,power_law_1.2,0.07610880136489868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,2,power_law_1.2,0.2931839942932129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,64,power_law_1.2,0.0746944010257721
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,2,power_law_1.2,0.3595648050308228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,64,power_law_1.2,0.0830784022808075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,2,power_law_1.2,0.5346687793731689
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,32,power_law_1.01,0.10515199899673462
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,2,power_law_1.2,0.7417024135589599
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,64,power_law_1.2,0.08348159790039063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,32,power_law_1.01,0.08529919981956482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,2,power_law_1.2,0.903923225402832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,64,power_law_1.2,0.08615040183067321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,32,power_law_1.01,0.0689087986946106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,2,power_law_1.2,1.4464256286621093
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,64,power_law_1.2,0.08431360125541687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,32,power_law_1.01,0.06358399987220764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,2,power_law_1.2,2.821855926513672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,64,power_law_1.2,0.08840960264205933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,32,power_law_1.01,0.06889600157737732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,64,power_law_1.2,0.09434880018234253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,32,power_law_1.01,0.07751039862632751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,64,power_law_1.2,0.10520319938659668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,32,power_law_1.01,0.07914239764213563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,32,power_law_1.01,0.08160640001296997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,64,power_law_1.2,0.10929280519485474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,32,power_law_1.01,0.08180480003356934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,64,power_law_1.2,0.11994240283966065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,32,power_law_1.01,0.0834496021270752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,64,power_law_1.2,0.13715840578079225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,32,power_law_1.01,0.08773120045661927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,64,power_law_1.2,0.15620479583740235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,32,power_law_1.01,0.0859008014202118
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,64,power_law_1.2,0.18097280263900756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,32,power_law_1.01,0.09267200231552124
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,32,power_law_1.2,0.08594560027122497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,64,power_law_1.2,0.21040000915527343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,32,power_law_1.2,0.09864320158958435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,32,power_law_1.01,0.09758080244064331
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,64,power_law_1.2,0.26330881118774413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,32,power_law_1.2,0.05767679810523987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,32,power_law_1.01,0.1045375943183899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,64,power_law_1.2,0.3194175958633423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,32,power_law_1.2,0.060550397634506224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,32,power_law_1.01,0.11273599863052368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,64,power_law_1.2,0.44579200744628905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,32,power_law_1.2,0.06466559767723083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,32,power_law_1.01,0.1123136043548584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,64,power_law_1.2,0.5629248142242431
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,32,power_law_1.2,0.0673088014125824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,32,power_law_1.01,0.1254271984100342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,64,power_law_1.2,0.8455488204956054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,32,power_law_1.2,0.07735040187835693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,32,power_law_1.01,0.1366976022720337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,64,power_law_1.2,1.2424575805664062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,32,power_law_1.01,0.16311039924621581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,32,power_law_1.2,0.07898240089416504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,64,power_law_1.2,1.4132543563842774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,32,power_law_1.2,0.0804095983505249
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,32,power_law_1.01,0.18360960483551025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,64,power_law_1.2,2.184940719604492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,32,power_law_1.2,0.08266879916191101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,32,power_law_1.01,0.23745920658111572
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,32,power_law_1.2,0.082259202003479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,32,power_law_1.01,0.2847615957260132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,64,power_law_1.2,5.649951934814453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,32,power_law_1.2,0.0883840024471283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,32,power_law_1.01,0.3961535930633545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,32,power_law_1.2,0.09166719913482665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,32,power_law_1.01,0.4834047794342041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,32,power_law_1.2,0.09371520280838012
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,32,power_law_1.01,0.6978432178497315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,32,power_law_1.2,0.10006400346755981
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,32,power_law_1.01,0.8911680221557617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,32,power_law_1.2,0.10703999996185302
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,32,power_law_1.01,1.0650367736816406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,32,power_law_1.2,0.11052160263061524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,32,power_law_1.2,0.12997759580612184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,32,power_law_1.01,1.668172836303711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,32,power_law_1.2,0.13551360368728638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,32,power_law_1.01,3.3598270416259766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,16,power_law_1.01,0.0750976026058197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,32,power_law_1.2,0.1682752013206482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,16,power_law_1.01,0.08839679956436157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,32,power_law_1.2,0.19202560186386108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,16,power_law_1.01,0.060761600732803345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,32,power_law_1.2,0.24240639209747314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,16,power_law_1.01,0.0593280017375946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,32,power_law_1.2,0.2972287893295288
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,16,power_law_1.01,0.06423680186271667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,32,power_law_1.2,0.4313727855682373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,16,power_law_1.01,0.06977279782295227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,32,power_law_1.2,0.5129471778869629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,16,power_law_1.01,0.07938560247421264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,32,power_law_1.2,0.7290112018585205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,16,power_law_1.01,0.07939839959144593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,32,power_law_1.2,0.9854207992553711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,16,power_law_1.01,0.08103039860725403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,16,power_law_1.2,0.08119680285453797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,32,power_law_1.2,1.1502911567687988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,16,power_law_1.01,0.08266239762306213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,16,power_law_1.2,0.09122560024261475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,32,power_law_1.2,1.9625280380249024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,16,power_law_1.01,0.08657280206680298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,16,power_law_1.2,0.05722879767417908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,16,power_law_1.01,0.08963199853897094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,16,power_law_1.2,0.0615231990814209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,32,power_law_1.2,4.165568161010742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,16,power_law_1.01,0.09373440146446228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,16,power_law_1.2,0.06440320014953613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,16,power_law_1.01,0.10008319616317748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,16,power_law_1.2,0.06972799897193908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,16,power_law_1.01,0.1074560046195984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,16,power_law_1.2,0.07832319736480713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,16,power_law_1.01,0.11237119436264038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,16,power_law_1.2,0.08201599717140198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,16,power_law_1.01,0.11400959491729737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,16,power_law_1.2,0.08199679851531982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,16,power_law_1.01,0.134278404712677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,16,power_law_1.2,0.08672639727592468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,16,power_law_1.01,0.1469696044921875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,16,power_law_1.2,0.08792960047721862
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,16,power_law_1.01,0.16766079664230346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,16,power_law_1.2,0.09164159893989562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,16,power_law_1.01,0.19511040449142455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,16,power_law_1.2,0.09429759979248047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,16,power_law_1.01,0.24078080654144288
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,16,power_law_1.2,0.10331519842147827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,8,power_law_1.01,0.07119359970092773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,16,power_law_1.01,0.2981247901916504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,16,power_law_1.2,0.11253119707107544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,8,power_law_1.01,0.07344639897346497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,16,power_law_1.2,0.11518720388412476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,16,power_law_1.01,0.3882431983947754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,8,power_law_1.01,0.05644800066947937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,16,power_law_1.2,0.11806080341339112
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,16,power_law_1.01,0.508454418182373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,8,power_law_1.01,0.06302080154418946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,16,power_law_1.2,0.13608319759368898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,8,power_law_1.01,0.07017599940299987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,16,power_law_1.01,0.6925759792327881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,16,power_law_1.2,0.14407039880752565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,8,power_law_1.01,0.07528960108757018
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,16,power_law_1.01,0.8957311630249023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,16,power_law_1.2,0.17356159687042236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,8,power_law_1.01,0.08511360287666321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,16,power_law_1.01,1.076140785217285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,8,power_law_1.01,0.08799359798431397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,16,power_law_1.2,0.20161919593811034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,16,power_law_1.01,1.7939840316772462
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,8,power_law_1.01,0.08737279772758484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,16,power_law_1.2,0.2511807918548584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,8,power_law_1.01,0.0925055980682373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,16,power_law_1.01,3.2591167449951173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,16,power_law_1.2,0.3165055990219116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,8,power_law_1.01,0.09413759708404541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,16,power_law_1.2,0.4170623779296875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,8,power_law_1.01,0.095769602060318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,16,power_law_1.2,0.5419904232025147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,8,power_law_1.01,0.09639679789543151
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,16,power_law_1.2,0.7691199779510498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,8,power_law_1.01,0.10396800041198731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,16,power_law_1.2,1.034118366241455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,8,power_law_1.01,0.10926079750061035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,16,power_law_1.2,1.2292863845825195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,8,power_law_1.01,0.11788159608840942
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,16,power_law_1.2,2.0714303970336916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,8,power_law_1.01,0.12158080339431762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,8,power_law_1.01,0.1379583954811096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,16,power_law_1.2,4.141747283935547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,8,power_law_1.01,0.15516799688339233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,8,power_law_1.2,0.06977919936180114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,8,power_law_1.01,0.19157760143280028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,8,power_law_1.2,0.07203840017318726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,8,power_law_1.01,0.21208319664001465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,8,power_law_1.2,0.052774399518966675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,8,power_law_1.01,0.27497599124908445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,8,power_law_1.2,0.06261119842529297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,8,power_law_1.01,0.34010241031646726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,8,power_law_1.2,0.06423680186271667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,8,power_law_1.01,0.4355455875396729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,8,power_law_1.2,0.07795199751853943
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,8,power_law_1.01,0.5711040019989013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,8,power_law_1.2,0.08737279772758484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,8,power_law_1.01,0.7732607841491699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,8,power_law_1.2,0.08839679956436157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,8,power_law_1.01,0.9948351860046387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,8,power_law_1.2,0.09043840169906617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,8,power_law_1.01,1.2989567756652831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,8,power_law_1.2,0.09455360174179077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,8,power_law_1.01,1.870150375366211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,8,power_law_1.2,0.09475839734077454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,8,power_law_1.2,0.09946879744529724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,4,power_law_1.01,0.06889600157737732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,8,power_law_1.01,3.9224575042724608
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,8,power_law_1.2,0.09700480103492737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,4,power_law_1.01,0.07259520292282104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,8,power_law_1.2,0.10460799932479858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,4,power_law_1.01,0.06419199705123901
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,8,power_law_1.2,0.11421439647674561
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,4,power_law_1.01,0.07013760209083557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,8,power_law_1.2,0.11829119920730591
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,4,power_law_1.01,0.0791487991809845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,8,power_law_1.2,0.12424319982528687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,4,power_law_1.01,0.09059200286865235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,8,power_law_1.2,0.1479871988296509
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,4,power_law_1.01,0.10451840162277222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,8,power_law_1.2,0.1572224020957947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,4,power_law_1.01,0.11436159610748291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,64,power_law_1.01,0.1041152000427246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,8,power_law_1.2,0.19592959880828859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,4,power_law_1.01,0.10984959602355956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,64,power_law_1.01,0.09224320054054261
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,8,power_law_1.2,0.2297152042388916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,4,power_law_1.01,0.11436159610748291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,64,power_law_1.01,0.0820032000541687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,4,power_law_1.01,0.12070399522781372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,8,power_law_1.2,0.28748159408569335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,64,power_law_1.01,0.0662335991859436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,4,power_law_1.01,0.12440320253372192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,8,power_law_1.2,0.3341759920120239
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,64,power_law_1.01,0.07340160012245178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,4,power_law_1.01,0.12891520261764527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,8,power_law_1.2,0.4650239944458008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,64,power_law_1.01,0.07790079712867737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,4,power_law_1.2,0.06914560198783874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,4,power_law_1.01,0.13095680475234986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,8,power_law_1.2,0.5833983898162842
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,64,power_law_1.01,0.07585920095443725
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,4,power_law_1.2,0.06709120273590088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,4,power_law_1.01,0.14140160083770753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,64,power_law_1.01,0.08220800161361694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,8,power_law_1.2,0.8433024406433105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,4,power_law_1.2,0.058911997079849246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,4,power_law_1.01,0.14281599521636962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,64,power_law_1.01,0.08036479949951172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,8,power_law_1.2,1.1142399787902832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,4,power_law_1.2,0.06546559929847717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,4,power_law_1.01,0.14693119525909423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,64,power_law_1.01,0.08487039804458618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,4,power_law_1.2,0.07181439995765686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,8,power_law_1.2,1.401375961303711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,4,power_law_1.01,0.16925439834594727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,64,power_law_1.01,0.08855680227279664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,4,power_law_1.2,0.08549759984016418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,8,power_law_1.2,1.9875072479248046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,4,power_law_1.01,0.18810240030288697
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,64,power_law_1.01,0.09040639996528625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,4,power_law_1.2,0.1029312014579773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,4,power_law_1.01,0.22803840637207032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,64,power_law_1.01,0.0899839997291565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,4,power_law_1.2,0.10520319938659668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,8,power_law_1.2,3.9996353149414063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,4,power_law_1.01,0.2718400001525879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,64,power_law_1.01,0.09427840113639832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,4,power_law_1.2,0.11052160263061524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,4,power_law_1.01,0.3462080001831055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,4,power_law_1.2,0.1142016053199768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,64,power_law_1.01,0.10718079805374145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,4,power_law_1.01,0.41420159339904783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,4,power_law_1.2,0.11749119758605957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,64,power_law_1.01,0.10698879957199096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,4,power_law_1.2,0.1285375952720642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,64,power_law_1.01,0.11108479499816895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,4,power_law_1.01,0.5387072086334228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,4,power_law_1.2,0.12651519775390624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,64,power_law_1.01,0.12685439586639405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,4,power_law_1.01,0.7105343818664551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,4,power_law_1.2,0.1344831943511963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,64,power_law_1.01,0.1356608033180237
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,4,power_law_1.01,0.9673664093017578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,4,power_law_1.2,0.14737919569015503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,64,power_law_1.01,0.16433919668197633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,4,power_law_1.01,1.25796480178833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,4,power_law_1.2,0.14737279415130616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,64,power_law_1.01,0.18112640380859374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,4,power_law_1.01,1.5076031684875488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,4,power_law_1.2,0.16867200136184693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,64,power_law_1.01,0.23826560974121094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,4,power_law_1.01,2.3849727630615236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,4,power_law_1.2,0.187718403339386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,64,power_law_1.01,0.2763583898544312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,4,power_law_1.2,0.19407360553741454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,64,power_law_1.01,0.39842560291290285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,4,power_law_1.01,4.606643295288086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,4,power_law_1.2,0.23461759090423584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,64,power_law_1.01,0.4891520023345947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,4,power_law_1.2,0.28275198936462403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,64,power_law_1.01,0.6896448135375977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,4,power_law_1.2,0.35300478935241697
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,64,power_law_1.01,0.8743743896484375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,4,power_law_1.2,0.4400383949279785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,64,power_law_1.01,1.2026687622070313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,4,power_law_1.2,0.5920000076293945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,64,power_law_1.01,1.7103616714477539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,4,power_law_1.2,0.7216447830200196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,2,power_law_1.01,0.06321920156478882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,4,power_law_1.2,1.0104127883911134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,64,power_law_1.01,3.468761444091797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,2,power_law_1.01,0.06833919882774353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,4,power_law_1.2,1.2920063972473144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,2,power_law_1.01,0.06444799900054932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,2,power_law_1.01,0.0798143982887268
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,4,power_law_1.2,1.6567487716674805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,2,power_law_1.01,0.0933247983455658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,4,power_law_1.2,2.407551956176758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,2,power_law_1.01,0.10970879793167114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,2,power_law_1.01,0.1359231948852539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,4,power_law_1.2,4.910617446899414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,2,power_law_1.01,0.14001920223236083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,64,power_law_1.01,0.04184960126876831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,2,power_law_1.01,0.14371199607849122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,64,power_law_1.01,0.04017919898033142
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,64,power_law_1.01,0.0414463996887207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,2,power_law_1.01,0.15189759731292723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,64,power_law_1.01,0.0406464010477066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,2,power_law_1.01,0.16499840021133422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,64,power_law_1.01,0.03694080114364624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,2,power_law_1.01,0.17851519584655762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,64,power_law_1.01,0.03818880021572113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,2,power_law_1.01,0.1805567979812622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,2,power_law_1.2,0.06378239989280701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,64,power_law_1.2,0.04149760007858276
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,64,power_law_1.01,0.038176000118255615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,2,power_law_1.01,0.17626240253448486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,2,power_law_1.2,0.07032960057258605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,64,power_law_1.2,0.03925760090351105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,64,power_law_1.01,0.038176000118255615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,2,power_law_1.01,0.19571839570999144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,2,power_law_1.2,0.06562560200691223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,64,power_law_1.2,0.04252800047397613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,64,power_law_1.01,0.039001598954200745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,2,power_law_1.01,0.20040318965911866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,2,power_law_1.2,0.07832319736480713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,64,power_law_1.2,0.03925119936466217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,64,power_law_1.01,0.039001598954200745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,2,power_law_1.01,0.19857920408248902
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,64,power_law_1.2,0.03638400137424469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,2,power_law_1.2,0.08652160167694092
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,64,power_law_1.01,0.041043201088905336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,2,power_law_1.01,0.22398080825805664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,64,power_law_1.2,0.03944959938526153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,2,power_law_1.2,0.10392320156097412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,64,power_law_1.01,0.043084800243377686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,2,power_law_1.01,0.25102720260620115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,64,power_law_1.2,0.03966079950332642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,2,power_law_1.2,0.13935999870300292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,64,power_law_1.01,0.04552960097789764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,64,power_law_1.2,0.039654400944709775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,2,power_law_1.01,0.31122560501098634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,64,power_law_1.01,0.04390400052070618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,64,power_law_1.2,0.039059200882911684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,2,power_law_1.01,0.3685760021209717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,64,power_law_1.01,0.048614400625228885
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,64,power_law_1.2,0.03986560106277466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,64,power_law_1.01,0.050457602739334105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,2,power_law_1.01,0.485913610458374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,64,power_law_1.2,0.04188799858093262
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,64,power_law_1.01,0.05988479852676391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,2,power_law_1.01,0.6276351928710937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,64,power_law_1.2,0.04436480104923248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,64,power_law_1.01,0.06930559873580933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,2,power_law_1.01,0.7937344074249267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,64,power_law_1.2,0.04661760032176972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,64,power_law_1.01,0.06890239715576171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,2,power_law_1.01,0.959603214263916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,64,power_law_1.2,0.04539520144462585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,64,power_law_1.01,0.08241279721260071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,64,power_law_1.2,0.05112959742546082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,2,power_law_1.01,1.3780223846435546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,64,power_law_1.01,0.09305599927902222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,64,power_law_1.2,0.05440639853477478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,2,power_law_1.01,1.6735679626464843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,64,power_law_1.01,0.13112319707870485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,64,power_law_1.2,0.054604798555374146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,64,power_law_1.01,0.14917759895324706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,2,power_law_1.01,2.108127975463867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,64,power_law_1.2,0.061766397953033444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,64,power_law_1.01,0.21081600189208985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,2,power_law_1.01,3.2427135467529298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,64,power_law_1.2,0.07366399765014649
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,64,power_law_1.01,0.2552639961242676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,64,power_law_1.2,0.08840320110321045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,64,power_law_1.01,0.38429439067840576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,2,power_law_1.01,6.056684875488282
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,64,power_law_1.2,0.10805120468139648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,64,power_law_1.01,0.45306878089904784
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,64,power_law_1.2,0.13714560270309448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,64,power_law_1.2,0.1785215973854065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,64,power_law_1.01,0.5870463848114014
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,64,power_law_1.2,0.26166400909423826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,64,power_law_1.01,0.9710335731506348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,64,power_law_1.2,0.3173759937286377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,64,power_law_1.01,1.942406463623047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,64,power_law_1.2,0.4453567981719971
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,64,power_law_1.2,0.7376128196716308
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,32,power_law_1.01,0.04170239865779877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,64,power_law_1.2,0.8699199676513671
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,32,power_law_1.01,0.03925760090351105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,64,power_law_1.2,1.5146112442016602
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,32,power_law_1.01,0.034355199337005614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,32,power_law_1.01,0.03557760119438171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,64,power_law_1.2,3.3639678955078125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,32,power_law_1.01,0.037215998768806456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,32,power_law_1.01,0.03761279881000519
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,32,power_law_1.2,0.04226559996604919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,32,power_law_1.01,0.03864319920539856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,32,power_law_1.2,0.038176000118255615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,32,power_law_1.01,0.03945600092411041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,32,power_law_1.2,0.03776639997959137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,32,power_law_1.01,0.03945600092411041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,32,power_law_1.01,0.03966079950332642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,32,power_law_1.2,0.03694719970226288
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,32,power_law_1.01,0.041503998637199405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,32,power_law_1.2,0.03653759956359863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,32,power_law_1.01,0.04294399917125702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,32,power_law_1.2,0.03858560025691986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,16,power_law_1.01,0.05132160186767578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,32,power_law_1.01,0.044172799587249754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,32,power_law_1.2,0.03858560025691986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,16,power_law_1.01,0.03678719997406006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,32,power_law_1.01,0.04499199986457825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,32,power_law_1.2,0.03898879885673523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,16,power_law_1.01,0.03412480056285858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,32,power_law_1.01,0.049292799830436704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,32,power_law_1.2,0.038975998759269714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,16,power_law_1.01,0.03596799969673157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,32,power_law_1.01,0.050310397148132326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,32,power_law_1.2,0.03982079923152924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,16,power_law_1.01,0.036582401394844054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,32,power_law_1.01,0.057683199644088745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,16,power_law_1.01,0.040275201201438904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,32,power_law_1.2,0.04227199852466583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,32,power_law_1.01,0.06711040139198303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,16,power_law_1.01,0.04168959856033325
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,32,power_law_1.2,0.04349440038204193
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,32,power_law_1.01,0.06731520295143127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,16,power_law_1.01,0.040479999780654904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,32,power_law_1.2,0.044921600818634035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,32,power_law_1.01,0.08165119886398316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,16,power_law_1.01,0.04211840033531189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,32,power_law_1.2,0.044326400756835936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,32,power_law_1.01,0.096806401014328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,16,power_law_1.01,0.04252800047397613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,32,power_law_1.2,0.05128960013389587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,32,power_law_1.01,0.13468799591064454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,16,power_law_1.01,0.04457600116729736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,32,power_law_1.2,0.05087360143661499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,32,power_law_1.01,0.14677759408950805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,16,power_law_1.01,0.0456063985824585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,32,power_law_1.2,0.05660799741744995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,32,power_law_1.01,0.2030911922454834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,16,power_law_1.01,0.04702079892158508
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,32,power_law_1.2,0.06275839805603027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,16,power_law_1.01,0.044787201285362246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,32,power_law_1.01,0.25347199440002444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,32,power_law_1.2,0.0705344021320343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,16,power_law_1.01,0.049081599712371825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,32,power_law_1.01,0.37185280323028563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,32,power_law_1.2,0.09182720184326172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,16,power_law_1.01,0.05072000026702881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,32,power_law_1.2,0.10330239534378052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,32,power_law_1.01,0.5105152130126953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,16,power_law_1.01,0.056454402208328244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,32,power_law_1.2,0.13667839765548706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,32,power_law_1.01,0.5809599876403808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,16,power_law_1.01,0.06342399716377259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,32,power_law_1.2,0.16146559715270997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,32,power_law_1.01,0.8920191764831543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,16,power_law_1.01,0.06855040192604064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,32,power_law_1.2,0.24338560104370116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,16,power_law_1.01,0.08512639999389648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,32,power_law_1.01,1.832499122619629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,32,power_law_1.2,0.3166912078857422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,16,power_law_1.01,0.1076416015625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,32,power_law_1.2,0.4379456043243408
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,16,power_law_1.01,0.12668800354003906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,32,power_law_1.2,0.6417088031768798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,16,power_law_1.01,0.14942079782485962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,32,power_law_1.2,0.7637760162353515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,16,power_law_1.01,0.2035072088241577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,16,power_law_1.01,0.2567552089691162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,32,power_law_1.2,1.2296383857727051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,16,power_law_1.01,0.3595648050308228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,32,power_law_1.2,3.0302976608276366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,16,power_law_1.01,0.44086399078369143
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,16,power_law_1.2,0.0456063985824585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,16,power_law_1.2,0.034560000896453856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,16,power_law_1.01,0.5448895931243897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,16,power_law_1.2,0.03351680040359497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,16,power_law_1.01,0.9547072410583496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,16,power_law_1.2,0.034694400429725644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,16,power_law_1.2,0.036185601353645326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,16,power_law_1.01,1.7792255401611328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,16,power_law_1.2,0.03966079950332642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,16,power_law_1.2,0.04048640131950378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,16,power_law_1.2,0.041254401206970215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,16,power_law_1.2,0.042124798893928526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,8,power_law_1.01,0.04469760060310364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,16,power_law_1.2,0.043347200751304625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,8,power_law_1.01,0.03941119909286499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,16,power_law_1.2,0.04457600116729736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,8,power_law_1.01,0.03591679930686951
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,16,power_law_1.2,0.045817598700523376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,8,power_law_1.01,0.038387200236320494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,16,power_law_1.2,0.04642559885978699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,8,power_law_1.01,0.03816959857940674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,16,power_law_1.2,0.047654399275779726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,8,power_law_1.2,0.043750399351119997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,8,power_law_1.01,0.042483198642730716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,16,power_law_1.2,0.052985602617263795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,8,power_law_1.2,0.03392640054225922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,8,power_law_1.01,0.043884798884391785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,16,power_law_1.2,0.05399680137634277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,8,power_law_1.2,0.03616639971733093
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,8,power_law_1.01,0.043910399079322815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,16,power_law_1.2,0.05564799904823303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,8,power_law_1.2,0.03761920034885406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,16,power_law_1.2,0.06322559714317322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,8,power_law_1.01,0.044940799474716187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,8,power_law_1.2,0.03761279881000519
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,16,power_law_1.2,0.07611520290374756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,8,power_law_1.01,0.04635519981384277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,8,power_law_1.2,0.04293760061264038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,16,power_law_1.2,0.09271039962768554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,8,power_law_1.01,0.047603198885917665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,8,power_law_1.2,0.043347200751304625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,16,power_law_1.2,0.10540800094604492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,8,power_law_1.2,0.04373759925365448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,8,power_law_1.01,0.04943360090255737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,16,power_law_1.2,0.1461632013320923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,8,power_law_1.2,0.04519039988517761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,8,power_law_1.01,0.05087360143661499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,8,power_law_1.2,0.0449535995721817
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,8,power_law_1.01,0.05046399831771851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,16,power_law_1.2,0.16521600484848023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,8,power_law_1.2,0.04744960069656372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,8,power_law_1.01,0.05783680081367493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,16,power_law_1.2,0.23585920333862304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,8,power_law_1.2,0.047443199157714847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,8,power_law_1.01,0.059059202671051025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,16,power_law_1.2,0.3059007883071899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,8,power_law_1.2,0.04867199957370758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,8,power_law_1.01,0.060096001625061034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,16,power_law_1.2,0.41361279487609864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,8,power_law_1.2,0.052774399518966675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,8,power_law_1.01,0.07032319903373718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,16,power_law_1.2,0.5727551937103271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,8,power_law_1.2,0.05665919780731201
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,8,power_law_1.01,0.07975040078163147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,16,power_law_1.2,0.8064448356628418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,8,power_law_1.2,0.058713597059249875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,8,power_law_1.01,0.09592959880828858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,16,power_law_1.2,1.2199295997619628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,8,power_law_1.2,0.060761600732803345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,8,power_law_1.01,0.1182528018951416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,8,power_law_1.2,0.0756928026676178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,8,power_law_1.01,0.1446720004081726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,16,power_law_1.2,2.6238271713256838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,8,power_law_1.2,0.08389760255813598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,8,power_law_1.01,0.17191040515899658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,8,power_law_1.2,0.09904639720916748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,8,power_law_1.01,0.2534208059310913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,8,power_law_1.2,0.12076159715652465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,8,power_law_1.01,0.3081023931503296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,8,power_law_1.2,0.14984320402145385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,8,power_law_1.01,0.4313920021057129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,8,power_law_1.2,0.1832128047943115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,8,power_law_1.01,0.5288640022277832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,8,power_law_1.2,0.2723072052001953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,8,power_law_1.01,0.6486911773681641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,8,power_law_1.2,0.3312959909439087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,8,power_law_1.01,1.0650367736816406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,8,power_law_1.2,0.4924736022949219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,8,power_law_1.2,0.6585087776184082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,8,power_law_1.01,2.125907135009766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,4,power_law_1.01,0.04579200148582459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,8,power_law_1.2,0.7482560157775879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,4,power_law_1.01,0.035769599676132205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,8,power_law_1.2,1.272755241394043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,4,power_law_1.01,0.03720319867134094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,4,power_law_1.01,0.04048640131950378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,8,power_law_1.2,2.711884880065918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,4,power_law_1.01,0.044172799587249754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,4,power_law_1.01,0.04867199957370758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,4,power_law_1.01,0.049491199851036075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,4,power_law_1.01,0.05235840082168579
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,4,power_law_1.01,0.0515392005443573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,4,power_law_1.01,0.051545602083206174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,4,power_law_1.01,0.05542399883270264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,4,power_law_1.2,0.04268159866333008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,4,power_law_1.01,0.05563520193099976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,4,power_law_1.2,0.0357120007276535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,2,power_law_1.2,0.143231999874115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,4,power_law_1.01,0.05829120278358459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,4,power_law_1.2,0.03818239867687225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,2,power_law_1.2,0.15041919946670532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,4,power_law_1.01,0.059334397315979004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,4,power_law_1.2,0.03940480053424835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,2,power_law_1.2,0.15082240104675293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,4,power_law_1.01,0.06362879872322083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,4,power_law_1.2,0.04288640022277832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,4,power_law_1.01,0.06567040085792542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,2,power_law_1.2,0.15041919946670532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,4,power_law_1.2,0.05046399831771851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,4,power_law_1.01,0.0691648006439209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,2,power_law_1.2,0.15512959957122802
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,4,power_law_1.2,0.05190399885177612
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,4,power_law_1.01,0.08430079817771911
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,2,power_law_1.2,0.16024320125579833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,4,power_law_1.2,0.05311999917030334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,4,power_law_1.01,0.09783040285110474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,2,power_law_1.2,0.19506560564041137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,2,power_law_1.01,0.03966079950332642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,4,power_law_1.2,0.053932797908782956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,4,power_law_1.01,0.11422079801559448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,2,power_law_1.2,0.21472640037536622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,2,power_law_1.01,0.03925119936466217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,4,power_law_1.2,0.05334399938583374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,4,power_law_1.01,0.1351040005683899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,2,power_law_1.01,0.04088320136070252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,2,power_law_1.2,0.21942400932312012
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,4,power_law_1.2,0.05354239940643311
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,4,power_law_1.01,0.18056960105895997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,2,power_law_1.01,0.044582399725914004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,2,power_law_1.2,0.22782719135284424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,4,power_law_1.2,0.0529151976108551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,4,power_law_1.01,0.2123136043548584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,2,power_law_1.01,0.049055999517440795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,2,power_law_1.2,0.26735360622406007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,4,power_law_1.2,0.05578240156173706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,4,power_law_1.01,0.29894399642944336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,2,power_law_1.01,0.06177279949188232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,2,power_law_1.2,0.2724800109863281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,4,power_law_1.2,0.05742080211639404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,4,power_law_1.01,0.39273600578308104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,2,power_law_1.01,0.06546559929847717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,2,power_law_1.2,0.33678081035614016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,4,power_law_1.2,0.06541439890861511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,4,power_law_1.01,0.5121344089508056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,2,power_law_1.01,0.06628479957580566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,4,power_law_1.2,0.0713599979877472
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,2,power_law_1.01,0.06710399985313416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,4,power_law_1.01,0.661414384841919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,4,power_law_1.2,0.07051519751548767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,2,power_law_1.01,0.06872959733009339
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,4,power_law_1.01,0.8187135696411133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,4,power_law_1.2,0.08528000116348267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,2,power_law_1.01,0.07529600262641907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,4,power_law_1.01,1.2940671920776368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,4,power_law_1.2,0.10003199577331542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,2,power_law_1.01,0.07857279777526856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,4,power_law_1.2,0.12889599800109863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,2,power_law_1.01,0.0847104012966156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,4,power_law_1.01,2.704947280883789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,4,power_law_1.2,0.14467840194702147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,2,power_law_1.01,0.07996799945831298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,4,power_law_1.2,0.17907840013504028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,2,power_law_1.01,0.08751360177993775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,4,power_law_1.2,0.2241152048110962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,2,power_law_1.01,0.09535999894142151
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,2,power_law_1.01,0.09617919921875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,4,power_law_1.2,0.2970495939254761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,2,power_law_1.01,0.11666560173034668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,4,power_law_1.2,0.3933056116104126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,2,power_law_1.01,0.13304320573806763
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,4,power_law_1.2,0.5792640209197998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,2,power_law_1.01,0.1596351981163025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,4,power_law_1.2,0.7232319831848144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,2,power_law_1.01,0.19571839570999144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,4,power_law_1.2,0.929248046875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,2,power_law_1.01,0.24445440769195556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,4,power_law_1.2,1.4680831909179688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,2,power_law_1.01,0.3153215885162354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,2,power_law_1.01,0.42098560333251955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,4,power_law_1.2,3.1587072372436524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,2,power_law_1.01,0.5645567893981933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,2,power_law_1.01,0.7809599876403809
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,2,power_law_1.2,0.04007680118083954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,2,power_law_1.01,0.9530688285827636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,2,power_law_1.2,0.03761920034885406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,2,power_law_1.01,1.1334976196289062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,2,power_law_1.2,0.041715198755264284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,2,power_law_1.01,1.7767679214477539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,2,power_law_1.2,0.044377601146698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,2,power_law_1.2,0.049491199851036075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,2,power_law_1.01,3.378316879272461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,2,power_law_1.2,0.06259840130805969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,2,power_law_1.2,0.06339200139045716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,32,power_law_1.01,0.0797439992427826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,2,power_law_1.2,0.06587520241737366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,32,power_law_1.01,0.07953919768333435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,2,power_law_1.2,0.06669440269470214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,32,power_law_1.01,0.05619199872016907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,2,power_law_1.2,0.07242239713668823
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,32,power_law_1.01,0.05702400207519531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,2,power_law_1.2,0.07653120160102844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,32,power_law_1.01,0.06193280220031738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,2,power_law_1.2,0.07918720245361328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,32,power_law_1.01,0.06500480175018311
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,2,power_law_1.2,0.08267520070075988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,32,power_law_1.01,0.06848639845848084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,2,power_law_1.2,0.07775359749794006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,32,power_law_1.2,0.09086719751358033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,32,power_law_1.01,0.07339519858360291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,2,power_law_1.2,0.08615040183067321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,32,power_law_1.2,0.05459840297698974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,32,power_law_1.01,0.07094399929046631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,2,power_law_1.2,0.08758400082588196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,32,power_law_1.2,0.05603839755058289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,32,power_law_1.01,0.07503359913825988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,2,power_law_1.2,0.09987840056419373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,32,power_law_1.2,0.05603839755058289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,32,power_law_1.01,0.0797439992427826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,2,power_law_1.2,0.1133952021598816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,32,power_law_1.2,0.05952640175819397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,32,power_law_1.01,0.08097280263900757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,2,power_law_1.2,0.13715200424194335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,32,power_law_1.2,0.06751360297203064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,32,power_law_1.01,0.08488960266113281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,2,power_law_1.2,0.1613119959831238
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,2,power_law_1.2,0.19655040502548218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,32,power_law_1.2,0.06835200190544129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,32,power_law_1.01,0.0850816011428833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,2,power_law_1.2,0.2612607955932617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,32,power_law_1.01,0.09182720184326172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,2,power_law_1.2,0.30716800689697266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,32,power_law_1.01,0.09552639722824097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,2,power_law_1.2,0.4551936149597168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,32,power_law_1.01,0.09959040284156799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,32,power_law_1.01,0.11354240179061889
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,2,power_law_1.2,0.5407872200012207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,32,power_law_1.01,0.11845120191574096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,2,power_law_1.2,0.8424768447875977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,32,power_law_1.01,0.14753279685974122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,2,power_law_1.2,1.0034560203552245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,32,power_law_1.01,0.16187520027160646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,2,power_law_1.2,1.2330431938171387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,32,power_law_1.01,0.21758079528808594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,2,power_law_1.2,2.0133184432983398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,32,power_law_1.01,0.2460416078567505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,32,power_law_1.01,0.35827839374542236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,2,power_law_1.2,3.6611392974853514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,32,power_law_1.01,0.43097600936889646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,32,power_law_1.01,0.65032958984375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,32,power_law_1.01,0.7719423770904541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,32,power_law_1.01,0.9898816108703613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,32,power_law_1.01,1.5710975646972656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,32,power_law_1.01,3.1253311157226564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,16,power_law_1.01,0.07278720140457154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,16,power_law_1.01,0.06711680293083191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,16,power_law_1.01,0.049907198548316954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,16,power_law_1.01,0.05891839861869812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,16,power_law_1.01,0.0605567991733551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,16,power_law_1.01,0.06833919882774353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,16,power_law_1.01,0.06977279782295227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,16,power_law_1.01,0.07223039865493774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,16,power_law_1.2,0.07441920042037964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,16,power_law_1.01,0.07263360023498536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,16,power_law_1.01,0.07445759773254394
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,16,power_law_1.2,0.05497599840164184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,16,power_law_1.01,0.07899519801139832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,16,power_law_1.2,0.05292159914970398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,16,power_law_1.01,0.08452479839324951
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,16,power_law_1.2,0.0559935986995697
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,16,power_law_1.01,0.08676480054855347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,16,power_law_1.2,0.06234239935874939
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,16,power_law_1.01,0.08799359798431397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,16,power_law_1.2,0.06849279999732971
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,16,power_law_1.01,0.0957759976387024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,16,power_law_1.2,0.07175679802894593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,16,power_law_1.01,0.09884799718856811
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,16,power_law_1.2,0.07157120108604431
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,16,power_law_1.01,0.09824640154838563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,16,power_law_1.2,0.07464960217475891
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,16,power_law_1.01,0.11461759805679321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,16,power_law_1.2,0.07504000067710877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,16,power_law_1.01,0.1269055962562561
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,16,power_law_1.2,0.08180480003356934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,16,power_law_1.01,0.14860160350799562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,16,power_law_1.2,0.0815936028957367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,16,power_law_1.01,0.1709439992904663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,16,power_law_1.2,0.08630399703979492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,16,power_law_1.01,0.21415040493011475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,16,power_law_1.2,0.09060479998588562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,16,power_law_1.01,0.26474239826202395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,16,power_law_1.2,0.09592959880828858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,16,power_law_1.01,0.3456383943557739
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,16,power_law_1.2,0.10576000213623046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,16,power_law_1.01,0.4511040210723877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,16,power_law_1.2,0.10535039901733398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,16,power_law_1.2,0.11928319931030273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,16,power_law_1.01,0.6401343822479248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,16,power_law_1.2,0.12906240224838256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,16,power_law_1.01,0.8306048393249512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,16,power_law_1.2,0.1559424042701721
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,16,power_law_1.01,1.0444095611572266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,16,power_law_1.2,0.18952959775924683
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,16,power_law_1.01,1.6239999771118163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,16,power_law_1.2,0.23928959369659425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,16,power_law_1.2,0.2876159906387329
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,16,power_law_1.01,3.061836814880371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,16,power_law_1.2,0.3748608112335205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,16,power_law_1.2,0.5116672039031982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,16,power_law_1.2,0.7658368110656738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,16,power_law_1.2,0.9960191726684571
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,16,power_law_1.2,1.31080322265625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,16,power_law_1.2,1.9665664672851562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,16,power_law_1.2,3.765919876098633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,8,power_law_1.01,0.06751360297203064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,8,power_law_1.01,0.06465920209884643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,8,power_law_1.01,0.055238401889801024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,8,power_law_1.01,0.05809919834136963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,8,power_law_1.01,0.06506239771842956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,8,power_law_1.01,0.07325440049171447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,8,power_law_1.01,0.07420799732208253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,8,power_law_1.01,0.07653120160102844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,8,power_law_1.01,0.07817599773406983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,8,power_law_1.01,0.07980800271034241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,8,power_law_1.2,0.0670527994632721
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,8,power_law_1.01,0.07898240089416504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,8,power_law_1.2,0.05598719716072083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,8,power_law_1.01,0.0873856008052826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,8,power_law_1.2,0.05496960282325745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,8,power_law_1.01,0.08963199853897094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,8,power_law_1.2,0.05907840132713318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,2,power_law_1.2,0.3904383897781372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,8,power_law_1.01,0.09107840061187744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,8,power_law_1.2,0.06313599944114685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,2,power_law_1.2,0.4973311901092529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,8,power_law_1.01,0.09986559748649597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,8,power_law_1.2,0.07278079986572265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,2,power_law_1.2,0.5702400207519531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,8,power_law_1.01,0.10254080295562744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,8,power_law_1.2,0.07544320225715637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,2,power_law_1.2,0.7711679935455322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,8,power_law_1.01,0.11093120574951172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,8,power_law_1.2,0.07872639894485474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,8,power_law_1.01,0.12527999877929688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,2,power_law_1.2,0.9825152397155762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,8,power_law_1.2,0.07913600206375122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,8,power_law_1.01,0.14042880535125732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,8,power_law_1.2,0.08302720189094544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,2,power_law_1.2,1.3910783767700194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,8,power_law_1.01,0.16092159748077392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,8,power_law_1.2,0.08609279990196228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,2,power_law_1.2,1.7533695220947265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,8,power_law_1.01,0.19434880018234252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,8,power_law_1.2,0.09367039799690247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,2,power_law_1.2,2.1205759048461914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,8,power_law_1.01,0.24488320350646972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,8,power_law_1.2,0.09429759979248047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,8,power_law_1.01,0.2977216005325317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,8,power_law_1.2,0.09839360117912292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,2,power_law_1.2,3.2405567169189453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,8,power_law_1.01,0.39231998920440675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,8,power_law_1.2,0.10902400016784668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,2,power_law_1.2,6.383699035644531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,8,power_law_1.2,0.11088000535964966
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,8,power_law_1.01,0.5031295776367187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,8,power_law_1.2,0.11272959709167481
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,8,power_law_1.01,0.6835584163665771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,8,power_law_1.2,0.12910079956054688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,8,power_law_1.01,0.873196792602539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,8,power_law_1.2,0.14835840463638306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,8,power_law_1.01,1.1203968048095703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,8,power_law_1.2,0.16596479415893556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,8,power_law_1.01,1.7038656234741212
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,8,power_law_1.2,0.19096319675445556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,8,power_law_1.2,0.25033600330352784
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,8,power_law_1.01,3.538457489013672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,8,power_law_1.2,0.3140352010726929
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,8,power_law_1.2,0.429747200012207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,8,power_law_1.2,0.5067584037780761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,8,power_law_1.2,0.7895808219909668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,8,power_law_1.2,1.0172351837158202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,8,power_law_1.2,1.2284735679626464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,4,power_law_1.01,0.06727039813995361
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,8,power_law_1.2,1.8774784088134766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,4,power_law_1.01,0.060089600086212155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,4,power_law_1.01,0.057843202352523805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,8,power_law_1.2,3.969504165649414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,4,power_law_1.01,0.06603519916534424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,4,power_law_1.01,0.07056000232696533
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,4,power_law_1.01,0.07995520234107971
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,4,power_law_1.01,0.08488320112228394
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,4,power_law_1.2,0.06627839803695679
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,4,power_law_1.01,0.08979200124740601
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,4,power_law_1.2,0.0546239972114563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,4,power_law_1.01,0.09143679738044738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,4,power_law_1.2,0.05604479908943176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,4,power_law_1.01,0.09343360066413879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,4,power_law_1.2,0.058303999900817874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,4,power_law_1.01,0.09882240295410157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,4,power_law_1.2,0.06956160068511963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,4,power_law_1.01,0.10146559476852417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,4,power_law_1.2,0.0822655975818634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,4,power_law_1.01,0.10986239910125732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,4,power_law_1.2,0.0830847978591919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,4,power_law_1.01,0.11519360542297363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,32,power_law_1.2,0.06955519914627076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,4,power_law_1.2,0.08758400082588196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,4,power_law_1.01,0.12296960353851319
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,32,power_law_1.2,0.07160320281982421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,4,power_law_1.2,0.09045760035514831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,4,power_law_1.01,0.12993279695510865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,32,power_law_1.2,0.07120640277862549
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,4,power_law_1.2,0.09701120257377624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,4,power_law_1.01,0.1319808006286621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,32,power_law_1.2,0.07980160117149353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,4,power_law_1.2,0.09824000000953674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,4,power_law_1.01,0.15238399505615235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,4,power_law_1.2,0.10417280197143555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,32,power_law_1.2,0.08021119832992554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,4,power_law_1.01,0.16595840454101562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,4,power_law_1.2,0.10090240240097045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,32,power_law_1.2,0.08389760255813598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,4,power_law_1.01,0.19137279987335204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,4,power_law_1.2,0.1164736032485962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,32,power_law_1.2,0.08553599715232849
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,4,power_law_1.01,0.23213438987731932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,4,power_law_1.2,0.12076799869537354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,2,power_law_1.01,0.05865600109100342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,32,power_law_1.2,0.09413759708404541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,4,power_law_1.01,0.30113921165466306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,4,power_law_1.2,0.1314239978790283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,2,power_law_1.01,0.06253439784049988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,32,power_law_1.2,0.09823359847068787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,4,power_law_1.01,0.3715903997421265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,4,power_law_1.2,0.13078399896621704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,2,power_law_1.01,0.06275200247764587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,32,power_law_1.2,0.10069119930267334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,4,power_law_1.01,0.48423042297363283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,4,power_law_1.2,0.1486080050468445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,2,power_law_1.01,0.07175679802894593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,32,power_law_1.2,0.1115455985069275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,4,power_law_1.01,0.6083519935607911
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,4,power_law_1.2,0.17238399982452393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,2,power_law_1.01,0.0840511977672577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,32,power_law_1.2,0.13139840364456176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,4,power_law_1.01,0.8649472236633301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,4,power_law_1.2,0.1950976014137268
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,2,power_law_1.01,0.10249600410461426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,32,power_law_1.2,0.15639679431915282
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,4,power_law_1.01,1.0982336044311523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,4,power_law_1.2,0.23503360748291016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,2,power_law_1.01,0.10329600572586059
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,32,power_law_1.2,0.18465280532836914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,4,power_law_1.01,1.3247167587280273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,4,power_law_1.2,0.29217920303344724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,2,power_law_1.01,0.11068160533905029
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,32,power_law_1.2,0.23442559242248534
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,4,power_law_1.01,2.044806480407715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,4,power_law_1.2,0.3724800109863281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,2,power_law_1.01,0.11353600025177002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,32,power_law_1.2,0.29074559211730955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,4,power_law_1.2,0.5191103935241699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,2,power_law_1.01,0.11720960140228272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,32,power_law_1.2,0.39721601009368895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,4,power_law_1.01,4.540083312988282
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,2,power_law_1.01,0.13197439908981323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,4,power_law_1.2,0.6499648094177246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,32,power_law_1.2,0.5006656169891357
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,2,power_law_1.01,0.13565440177917482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,4,power_law_1.2,0.8949055671691895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,32,power_law_1.2,0.836736011505127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,2,power_law_1.01,0.1471168041229248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,4,power_law_1.2,1.3415679931640625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,32,power_law_1.2,1.0435520172119142
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,2,power_law_1.01,0.1454848051071167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,4,power_law_1.2,1.4884223937988281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,32,power_law_1.2,1.2129535675048828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,2,power_law_1.01,0.1573632001876831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,4,power_law_1.2,2.3411840438842773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,32,power_law_1.2,2.2549760818481444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,2,power_law_1.01,0.16799999475479127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,2,power_law_1.01,0.16577279567718506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,4,power_law_1.2,4.945030212402344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,32,power_law_1.2,3.981439971923828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,2,power_law_1.01,0.19300479888916017
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,2,power_law_1.01,0.2153343915939331
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,2,power_law_1.01,0.26550400257110596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,2,power_law_1.01,0.3117824077606201
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,2,power_law_1.01,0.3904320001602173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,2,power_law_1.01,0.49200639724731443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,2,power_law_1.01,0.668345594406128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,2,power_law_1.01,0.8215295791625976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,2,power_law_1.01,1.1608832359313965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,2,power_law_1.01,1.4760767936706543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,64,power_law_1.01,0.13345919847488402
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,64,power_law_1.2,0.15066239833831788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,64,power_law_1.01,0.11543680429458618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,2,power_law_1.01,1.7644224166870117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,64,power_law_1.2,0.11134079694747925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,2,power_law_1.2,0.06234880089759827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,64,power_law_1.01,0.09249280095100403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,64,power_law_1.2,0.11175040006637574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,2,power_law_1.01,2.670867156982422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,2,power_law_1.2,0.058259201049804685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,64,power_law_1.01,0.08245760202407837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,64,power_law_1.2,0.07693439722061157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,2,power_law_1.2,0.05988479852676391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,2,power_law_1.01,5.243571090698242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,64,power_law_1.01,0.07714560031890869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,2,power_law_1.2,0.0689087986946106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,64,power_law_1.2,0.08019199967384338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,2,power_law_1.2,0.08037760257720947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,64,power_law_1.01,0.08227199912071229
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,64,power_law_1.2,0.07386879920959473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,2,power_law_1.2,0.10350079536437988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,64,power_law_1.01,0.09044479727745056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,64,power_law_1.2,0.08615040183067321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,2,power_law_1.2,0.10862720012664795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,64,power_law_1.01,0.09535999894142151
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,64,power_law_1.2,0.09555839896202087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,2,power_law_1.2,0.10945919752120972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,2,power_law_1.2,0.11907839775085449
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,64,power_law_1.01,0.09351680278778077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,64,power_law_1.2,0.09004160165786743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,2,power_law_1.2,0.12277760505676269
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,64,power_law_1.01,0.0949567973613739
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,64,power_law_1.2,0.0945472002029419
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,2,power_law_1.2,0.12912000417709352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,64,power_law_1.01,0.09925119876861573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,64,power_law_1.2,0.09720320105552674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,2,power_law_1.2,0.1397696018218994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,32,power_law_1.01,0.09591680169105529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,64,power_law_1.01,0.09740800261497498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,64,power_law_1.2,0.09679999947547913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,2,power_law_1.2,0.14691840410232543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,32,power_law_1.01,0.09879040122032165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,64,power_law_1.01,0.10396800041198731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,2,power_law_1.2,0.15041279792785645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,64,power_law_1.2,0.09249920248985291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,32,power_law_1.01,0.0955136001110077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,2,power_law_1.2,0.14979840517044068
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,64,power_law_1.01,0.1047808051109314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,64,power_law_1.2,0.10295039415359497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,2,power_law_1.2,0.16717439889907837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,32,power_law_1.01,0.06213120222091675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,64,power_law_1.01,0.10888320207595825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,64,power_law_1.2,0.11052160263061524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,2,power_law_1.2,0.1678272008895874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,32,power_law_1.01,0.07217280268669128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,64,power_law_1.01,0.11811840534210205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,64,power_law_1.2,0.11809279918670654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,2,power_law_1.2,0.19711359739303588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,32,power_law_1.01,0.07422080039978027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,64,power_law_1.01,0.12138880491256714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,64,power_law_1.2,0.13059200048446656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,2,power_law_1.2,0.21512320041656494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,32,power_law_1.01,0.08097280263900757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,64,power_law_1.01,0.13797760009765625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,2,power_law_1.2,0.2610111951828003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,64,power_law_1.2,0.15352319478988646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,2,power_law_1.2,0.3158720016479492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,32,power_law_1.01,0.08978559970855712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,64,power_law_1.01,0.15208959579467773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,64,power_law_1.2,0.15148160457611085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,2,power_law_1.2,0.40517759323120117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,32,power_law_1.01,0.0875328004360199
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,64,power_law_1.01,0.18138240575790404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,64,power_law_1.2,0.20020480155944825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,2,power_law_1.2,0.5206719875335694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,32,power_law_1.01,0.09449599981307984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,64,power_law_1.01,0.21599359512329103
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,64,power_law_1.2,0.2366719961166382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,2,power_law_1.2,0.7051968097686767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,32,power_law_1.01,0.09755520224571228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,64,power_law_1.01,0.28254079818725586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,64,power_law_1.2,0.3022016048431396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,2,power_law_1.2,0.8223487854003906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,32,power_law_1.01,0.09797760248184204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,64,power_law_1.01,0.3357952117919922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,64,power_law_1.2,0.3579200029373169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,2,power_law_1.2,1.2342016220092773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,32,power_law_1.01,0.10124800205230713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,64,power_law_1.01,0.44659838676452634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,64,power_law_1.2,0.4928703784942627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,2,power_law_1.2,1.6243648529052734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,32,power_law_1.01,0.1045375943183899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,64,power_law_1.01,0.5203135967254638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,64,power_law_1.2,0.5801216125488281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,2,power_law_1.2,1.8205440521240235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,32,power_law_1.01,0.11006720066070556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,64,power_law_1.01,0.7396671772003174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,64,power_law_1.2,0.8764608383178711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,2,power_law_1.2,2.8721855163574217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,32,power_law_1.01,0.1164031982421875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,64,power_law_1.01,0.9911616325378418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,64,power_law_1.2,1.097043228149414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,2,power_law_1.2,5.594400024414062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,32,power_law_1.01,0.12337919473648071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,64,power_law_1.01,1.1990336418151855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,64,power_law_1.2,1.352633571624756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,32,power_law_1.01,0.140774405002594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,64,power_law_1.01,1.8832704544067382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,64,power_law_1.2,2.0751615524291993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,32,power_law_1.01,0.1454848051071167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,32,power_law_1.01,0.17415679693222047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,64,power_law_1.01,3.8110462188720704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,64,power_law_1.2,4.507769775390625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,32,power_law_1.01,0.20405759811401367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,32,power_law_1.01,0.26549758911132815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,32,power_law_1.01,0.3146559953689575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,32,power_law_1.01,0.41623678207397463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,32,power_law_1.2,0.0889792025089264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,32,power_law_1.01,0.5374656200408936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,32,power_law_1.2,0.09798399806022644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,32,power_law_1.01,0.7670527935028076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,32,power_law_1.2,0.08488320112228394
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,32,power_law_1.2,0.06316159963607788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,32,power_law_1.01,0.9321279525756836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,32,power_law_1.2,0.0693120002746582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,32,power_law_1.01,1.1895487785339356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,16,power_law_1.01,0.06792320013046264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,16,power_law_1.2,0.07120000123977661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,32,power_law_1.2,0.07710080146789551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,16,power_law_1.01,0.08923519849777221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,32,power_law_1.01,1.7816383361816406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,16,power_law_1.2,0.08880640268325805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,32,power_law_1.2,0.08035839796066284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,16,power_law_1.01,0.10397440195083618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,16,power_law_1.2,0.07386239767074584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,32,power_law_1.2,0.0846783995628357
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,32,power_law_1.01,3.5330623626708983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,16,power_law_1.01,0.05973759889602661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,16,power_law_1.2,0.05927680134773254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,32,power_law_1.2,0.08692479729652405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,16,power_law_1.01,0.06915839910507202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,16,power_law_1.2,0.06710399985313416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,32,power_law_1.2,0.09758080244064331
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,16,power_law_1.01,0.07815679907798767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,16,power_law_1.2,0.07363200187683105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,32,power_law_1.2,0.09546239972114563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,16,power_law_1.01,0.08268160223960877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,32,power_law_1.2,0.09675520062446594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,16,power_law_1.2,0.07693439722061157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,16,power_law_1.01,0.08511999845504761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,32,power_law_1.2,0.10331519842147827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,16,power_law_1.2,0.0859391987323761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,16,power_law_1.01,0.0902463972568512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,32,power_law_1.2,0.106387197971344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,16,power_law_1.2,0.0904640018939972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,32,power_law_1.2,0.11682560443878173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,16,power_law_1.01,0.09373440146446228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,16,power_law_1.2,0.09208319783210754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,32,power_law_1.2,0.11844480037689209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,16,power_law_1.01,0.09864959716796876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,16,power_law_1.2,0.09597439765930176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,32,power_law_1.2,0.12952959537506104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,16,power_law_1.01,0.10561280250549317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,16,power_law_1.2,0.09946879744529724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,8,power_law_1.01,0.06725119948387145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,32,power_law_1.2,0.1463104009628296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,16,power_law_1.01,0.10232959985733033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,16,power_law_1.2,0.10560640096664428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,8,power_law_1.01,0.07420799732208253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,32,power_law_1.2,0.15185279846191407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,16,power_law_1.01,0.10885759592056274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,16,power_law_1.2,0.1053887963294983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,8,power_law_1.01,0.10166399478912354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,32,power_law_1.2,0.1913856029510498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,16,power_law_1.01,0.11830400228500366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,16,power_law_1.2,0.11461759805679321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,8,power_law_1.01,0.06234239935874939
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,32,power_law_1.2,0.2186176061630249
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,16,power_law_1.01,0.12097280025482178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,16,power_law_1.2,0.12055679559707641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,8,power_law_1.01,0.06970880031585694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,32,power_law_1.2,0.2790208101272583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,16,power_law_1.01,0.12485120296478272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,16,power_law_1.2,0.12933119535446166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,8,power_law_1.01,0.08158720135688782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,32,power_law_1.2,0.3331007957458496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,16,power_law_1.01,0.142086398601532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,16,power_law_1.2,0.14615039825439452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,8,power_law_1.01,0.08855040073394775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,32,power_law_1.2,0.4494016170501709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,16,power_law_1.01,0.15231360197067262
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,16,power_law_1.2,0.16129920482635499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,8,power_law_1.01,0.09961599707603455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,32,power_law_1.2,0.5452544212341308
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,16,power_law_1.01,0.18752000331878663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,16,power_law_1.2,0.18957439661026002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,8,power_law_1.01,0.10330239534378052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,32,power_law_1.2,0.7838655948638916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,16,power_law_1.01,0.21006720066070556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,16,power_law_1.2,0.22316160202026367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,8,power_law_1.01,0.10760960578918458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,32,power_law_1.2,1.0654591560363769
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,16,power_law_1.01,0.26800639629364015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,16,power_law_1.2,0.28255999088287354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,8,power_law_1.01,0.10965759754180908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,16,power_law_1.01,0.3233151912689209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,16,power_law_1.2,0.3497215986251831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,8,power_law_1.01,0.112716805934906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,32,power_law_1.2,1.3972224235534667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,16,power_law_1.01,0.441267204284668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,8,power_law_1.01,0.11312639713287354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,16,power_law_1.2,0.4633664131164551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,32,power_law_1.2,2.1070783615112303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,16,power_law_1.01,0.5617023944854737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,8,power_law_1.01,0.115174400806427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,16,power_law_1.2,0.5649600028991699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,32,power_law_1.2,3.900697708129883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,8,power_law_1.01,0.12993279695510865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,16,power_law_1.01,0.8027520179748535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,16,power_law_1.2,0.8310015678405762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,8,power_law_1.01,0.13587199449539183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,16,power_law_1.01,0.9661824226379394
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,16,power_law_1.2,1.0406975746154785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,8,power_law_1.01,0.14180480241775512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,16,power_law_1.01,1.1801983833312988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,16,power_law_1.2,1.3063424110412598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,8,power_law_1.01,0.16106239557266236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,16,power_law_1.01,1.827564811706543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,16,power_law_1.2,2.0370624542236326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,8,power_law_1.01,0.17559679746627807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,8,power_law_1.01,0.20775039196014405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,16,power_law_1.01,3.6738433837890625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,16,power_law_1.2,3.9609024047851564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,8,power_law_1.01,0.2415424108505249
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,8,power_law_1.01,0.3040064096450806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,8,power_law_1.01,0.3664639949798584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,8,power_law_1.2,0.07342079877853394
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,8,power_law_1.01,0.4944511890411377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,8,power_law_1.2,0.07607679963111877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,8,power_law_1.01,0.6247168064117432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,8,power_law_1.2,0.07299839854240417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,8,power_law_1.01,0.8665920257568359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,8,power_law_1.2,0.06317440271377564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,8,power_law_1.01,1.0879103660583496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,8,power_law_1.2,0.0689087986946106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,8,power_law_1.01,1.3796031951904297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,8,power_law_1.2,0.08057600259780884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,8,power_law_1.01,2.0026111602783203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,8,power_law_1.2,0.08611199855804444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,8,power_law_1.2,0.1004480004310608
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,8,power_law_1.01,4.002489471435547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,8,power_law_1.2,0.10289280414581299
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,4,power_law_1.01,0.06710399985313416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,4,power_law_1.2,0.06894720196723939
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,8,power_law_1.2,0.10618239641189575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,4,power_law_1.01,0.07018880248069763
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,4,power_law_1.2,0.06854400038719177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,8,power_law_1.2,0.10884480476379395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,4,power_law_1.01,0.08840960264205933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,4,power_law_1.2,0.06627839803695679
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,8,power_law_1.2,0.11638400554656983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,4,power_law_1.01,0.06567680239677429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,4,power_law_1.2,0.06587520241737366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,8,power_law_1.2,0.11724159717559815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,4,power_law_1.01,0.07694079875946044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,4,power_law_1.2,0.07487360239028931
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,8,power_law_1.2,0.11621760129928589
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,4,power_law_1.01,0.09128959774971009
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,4,power_law_1.2,0.09043840169906617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,8,power_law_1.2,0.12931840419769286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,8,power_law_1.2,0.1342527985572815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,4,power_law_1.01,0.10028799772262573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,4,power_law_1.2,0.09741439819335937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,8,power_law_1.2,0.14796160459518432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,4,power_law_1.01,0.11215360164642334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,8,power_law_1.2,0.16637439727783204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,4,power_law_1.01,0.12200319766998291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,8,power_law_1.2,0.17969919443130494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,4,power_law_1.01,0.12466559410095215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,8,power_law_1.2,0.21962239742279052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,4,power_law_1.01,0.13162239789962768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,8,power_law_1.2,0.24994559288024903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,4,power_law_1.01,0.1326591968536377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,8,power_law_1.2,0.317740797996521
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,4,power_law_1.01,0.13920639753341674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,8,power_law_1.2,0.39146881103515624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,4,power_law_1.01,0.14328960180282593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,8,power_law_1.2,0.5112639904022217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,4,power_law_1.01,0.15066879987716675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,4,power_law_1.01,0.15639679431915282
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,8,power_law_1.2,0.6581183910369873
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,4,power_law_1.01,0.16709760427474976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,8,power_law_1.2,0.899782371520996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,2,power_law_1.01,0.06418560147285461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,4,power_law_1.01,0.19162240028381347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,2,power_law_1.01,0.07175679802894593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,8,power_law_1.2,1.0957695960998535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,4,power_law_1.01,0.21334400177001953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,2,power_law_1.01,0.08303359746932984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,8,power_law_1.2,1.4099007606506349
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,4,power_law_1.01,0.25715839862823486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,2,power_law_1.01,0.07953919768333435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,8,power_law_1.2,2.216422462463379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,4,power_law_1.01,0.29381120204925537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,2,power_law_1.01,0.10083839893341065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,8,power_law_1.2,4.191302490234375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,4,power_law_1.01,0.37881600856781006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,2,power_law_1.01,0.12030719518661499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,4,power_law_1.01,0.4539775848388672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,2,power_law_1.01,0.1387392044067383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,4,power_law_1.01,0.6087999820709229
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,2,power_law_1.01,0.16720000505447388
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,4,power_law_1.01,0.7970047950744629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,2,power_law_1.01,0.18399360179901122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,2,power_law_1.01,0.17170560359954834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,4,power_law_1.01,1.0581184387207032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,2,power_law_1.01,0.194649600982666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,4,power_law_1.01,1.3219200134277345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,2,power_law_1.01,0.19792640209197998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,4,power_law_1.01,1.6174400329589844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,2,power_law_1.01,0.19668480157852172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,4,power_law_1.01,2.521824073791504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,2,power_law_1.01,0.196288001537323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,2,power_law_1.01,0.20918400287628175
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,4,power_law_1.01,4.848793411254883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,2,power_law_1.01,0.21921279430389404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,2,power_law_1.01,0.22739839553833008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,8,8,power_law_1.01,0.018361599743366243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,2,power_law_1.01,0.2579200029373169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,8,8,power_law_1.01,0.018169599771499633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,2,power_law_1.01,0.33943040370941163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,8,8,power_law_1.01,0.018764799833297728
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,8,8,power_law_1.01,0.017951999604701997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,2,power_law_1.01,0.4104896068572998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,8,8,power_law_1.01,0.01918720006942749
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,2,power_law_1.01,0.4109183788299561
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,8,8,power_law_1.01,0.019782400131225585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,8,8,power_law_1.01,0.019596800208091736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,2,power_law_1.01,0.5186367988586426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,8,8,power_law_1.01,0.021036800742149354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,2,power_law_1.01,0.6400767803192139
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,8,8,power_law_1.01,0.021638399362564086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,2,power_law_1.2,0.0650111973285675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,8,8,power_law_1.01,0.022259199619293214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,2,power_law_1.01,0.8374784469604493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,2,power_law_1.2,0.0705407977104187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,8,8,power_law_1.01,0.022457599639892578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,2,power_law_1.01,1.0715840339660645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,8,8,power_law_1.01,0.02696320116519928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,2,power_law_1.2,0.07218559980392455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,8,8,power_law_1.01,0.02778240144252777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,2,power_law_1.01,1.4809791564941406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,2,power_law_1.2,0.07996799945831298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,8,8,power_law_1.01,0.02778880000114441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,8,8,power_law_1.01,0.029836800694465638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,2,power_law_1.2,0.09389439821243287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,2,power_law_1.01,1.8961151123046875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,8,8,power_law_1.01,0.0341376006603241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,2,power_law_1.2,0.11416959762573242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,8,8,power_law_1.01,0.04023680090904236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,2,power_law_1.01,2.234457588195801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,8,8,power_law_1.01,0.04867199957370758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,2,power_law_1.2,0.13176319599151612
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,2,power_law_1.01,3.447065734863281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,8,8,power_law_1.01,0.04969600141048432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,2,power_law_1.2,0.16392960548400878
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,8,8,power_law_1.01,0.06997759938240052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,8,8,power_law_1.01,0.08001279830932617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,2,power_law_1.2,0.17909120321273803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,2,power_law_1.01,6.730419158935547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,8,8,power_law_1.01,0.11912959814071655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,2,power_law_1.2,0.17827199697494506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,8,8,power_law_1.01,0.15271040201187133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,2,power_law_1.2,0.18152960538864135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,8,8,power_law_1.01,0.21742079257965088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,8,8,power_law_1.2,0.01892479956150055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,8,8,power_law_1.01,0.27559680938720704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,2,power_law_1.2,0.20079360008239747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,8,8,power_law_1.2,0.018508799374103546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,8,8,power_law_1.01,0.405836820602417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,2,power_law_1.2,0.2065279960632324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,8,8,power_law_1.2,0.019123199582099914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,8,8,power_law_1.01,0.5293375968933105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,8,8,power_law_1.2,0.018905599415302277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,8,8,power_law_1.01,0.6401408195495606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,8,8,power_law_1.2,0.019519999623298645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,8,8,power_law_1.01,1.0696000099182128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,8,8,power_law_1.2,0.019942399859428406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,8,8,power_law_1.01,2.1214527130126952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,8,8,power_law_1.2,0.020364800095558168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,8,8,power_law_1.2,0.021376000344753267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,8,8,power_law_1.2,0.021996800601482392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,8,8,power_law_1.2,0.022201600670814513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,8,8,power_law_1.01,0.03639039993286133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,8,8,power_law_1.2,0.023231999576091768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,8,8,power_law_1.01,0.03824639916419983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,8,8,power_law_1.2,0.027526399493217467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,8,8,power_law_1.01,0.036800000071525577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,8,8,power_law_1.2,0.02691200077533722
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,8,8,power_law_1.01,0.03678719997406006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,8,8,power_law_1.2,0.02752000093460083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,8,8,power_law_1.01,0.03700479865074158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,8,8,power_law_1.01,0.03802880048751831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,8,8,power_law_1.01,0.03903999924659729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,8,8,power_law_1.01,0.038841599225997926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,8,8,power_law_1.01,0.03759360015392303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,8,8,power_law_1.01,0.03920640051364899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,8,8,power_law_1.01,0.04007680118083954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,8,8,power_law_1.01,0.040479999780654904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,8,8,power_law_1.01,0.0412992000579834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,8,8,power_law_1.01,0.041715198755264284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,8,8,power_law_1.01,0.046214398741722104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,8,8,power_law_1.01,0.049292799830436704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,8,8,power_law_1.01,0.05358719825744629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,8,8,power_law_1.01,0.05809919834136963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,8,8,power_law_1.01,0.06465920209884643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,8,8,power_law_1.01,0.07612159848213196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,8,8,power_law_1.01,0.08635519742965699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,8,8,power_law_1.01,0.11422079801559448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,8,8,power_law_1.01,0.12609920501708985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,8,8,power_law_1.01,0.1764799952507019
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,8,8,power_law_1.01,0.21578240394592285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,8,8,power_law_1.01,0.3087680101394653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,8,8,power_law_1.01,0.39110400676727297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,8,8,power_law_1.01,0.5272960186004638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,8,8,power_law_1.01,0.8088895797729492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,8,8,power_law_1.01,1.6022911071777344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,8,8,power_law_1.2,0.03681280016899109
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,8,8,power_law_1.2,0.038438400626182555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,8,8,power_law_1.2,0.03678080141544342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,8,8,power_law_1.2,0.03619199991226196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,8,8,power_law_1.2,0.037555199861526486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,8,8,power_law_1.2,0.03680639863014221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,8,8,power_law_1.2,0.037215998768806456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,8,8,power_law_1.2,0.038848000764846805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,8,8,power_law_1.2,0.038848000764846805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,8,8,power_law_1.2,0.038841599225997926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,8,8,power_law_1.2,0.04048640131950378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,8,8,power_law_1.2,0.040479999780654904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,8,8,power_law_1.2,0.0412992000579834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,8,8,power_law_1.2,0.042124798893928526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,8,8,power_law_1.2,0.0470335990190506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,8,8,power_law_1.2,0.05072000026702881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,8,8,power_law_1.2,0.05440639853477478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,8,8,power_law_1.2,0.06096000075340271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,8,8,power_law_1.2,0.0664255976676941
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,8,8,power_law_1.2,0.07858560085296631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,8,8,power_law_1.2,0.08800640106201171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,8,8,power_law_1.2,0.11256959438323974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,8,8,power_law_1.2,0.13612159490585327
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,8,8,power_law_1.2,0.18876160383224488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,8,8,power_law_1.2,0.2246016025543213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,8,8,power_law_1.2,0.3194175958633423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,8,8,power_law_1.2,0.41731839179992675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,8,8,power_law_1.2,0.519865608215332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,8,8,power_law_1.2,0.7826879978179931
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,8,8,power_law_1.2,1.661676788330078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,4,power_law_1.2,0.11296639442443848
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,16,4,power_law_1.01,0.018156799674034118
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,16,4,power_law_1.01,0.017951999604701997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,4,power_law_1.2,0.12320640087127685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,16,4,power_law_1.01,0.017951999604701997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,4,power_law_1.2,0.12322560548782349
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,16,4,power_law_1.01,0.01754239946603775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,4,power_law_1.2,0.1252671957015991
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,16,4,power_law_1.01,0.018566399812698364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,16,4,power_law_1.01,0.022463999688625336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,4,power_law_1.2,0.1307968020439148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,16,4,power_law_1.01,0.021644799411296843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,16,4,power_law_1.01,0.022463999688625336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,4,power_law_1.2,0.13468799591064454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,16,4,power_law_1.01,0.02327679991722107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,4,power_law_1.2,0.14287999868392945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,16,4,power_law_1.01,0.023071999847888946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,16,4,power_law_1.01,0.02451840043067932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,4,power_law_1.2,0.1543552041053772
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,16,4,power_law_1.01,0.028191998600959778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,4,power_law_1.2,0.15926400423049927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,16,4,power_law_1.01,0.029023998975753786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,16,4,power_law_1.01,0.028198400139808656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,4,power_law_1.2,0.16807039976119995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,16,4,power_law_1.01,0.02983039915561676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,16,4,power_law_1.01,0.03270399868488312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,4,power_law_1.2,0.19081599712371827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,16,4,power_law_1.01,0.037215998768806456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,4,power_law_1.2,0.21701760292053224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,16,4,power_law_1.01,0.04888319969177246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,16,4,power_law_1.01,0.04867199957370758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,4,power_law_1.2,0.2575743913650513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,16,4,power_law_1.01,0.07017599940299987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,4,power_law_1.2,0.2989376068115234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,16,4,power_law_1.01,0.085343998670578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,16,4,power_law_1.01,0.1066431999206543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,4,power_law_1.2,0.3775871992111206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,16,4,power_law_1.01,0.1449280023574829
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,4,power_law_1.2,0.463372802734375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,16,4,power_law_1.01,0.2192768096923828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,16,4,power_law_1.01,0.27088000774383547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,4,power_law_1.2,0.6333695888519287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,16,4,power_law_1.01,0.410752010345459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,4,power_law_1.2,0.7888256072998047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,16,4,power_law_1.01,0.5158336162567139
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,16,4,power_law_1.01,0.625600004196167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,4,power_law_1.2,1.090073585510254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,16,4,power_law_1.01,0.8281344413757324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,4,power_law_1.2,1.3554944038391112
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,16,4,power_law_1.01,1.8840959548950196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,4,power_law_1.2,1.7226560592651368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,4,power_law_1.2,2.5688703536987303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,16,4,power_law_1.2,0.018361599743366243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,4,power_law_1.2,4.958943939208984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,16,4,power_law_1.2,0.017951999604701997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,16,4,power_law_1.2,0.017951999604701997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,16,4,power_law_1.2,0.01754239946603775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,16,4,power_law_1.2,0.018156799674034118
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,16,4,power_law_1.01,0.040064001083374025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,16,4,power_law_1.2,0.02205439954996109
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,16,4,power_law_1.01,0.0367935985326767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,16,4,power_law_1.2,0.02082560062408447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,16,4,power_law_1.01,0.03763200044631958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,16,4,power_law_1.2,0.022457599639892578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,16,4,power_law_1.01,0.03761279881000519
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,16,4,power_law_1.2,0.02328319996595383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,16,4,power_law_1.01,0.038227200508117676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,16,4,power_law_1.2,0.02328319996595383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,16,4,power_law_1.01,0.03925119936466217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,16,4,power_law_1.2,0.025331199169158936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,16,4,power_law_1.01,0.03925119936466217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,16,4,power_law_1.2,0.026764801144599913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,16,4,power_law_1.01,0.04007680118083954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,16,4,power_law_1.2,0.02778240144252777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,16,4,power_law_1.01,0.03945600092411041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,16,4,power_law_1.2,0.028601598739624024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,16,4,power_law_1.01,0.04046080112457275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,16,4,power_law_1.2,0.02963840067386627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,16,4,power_law_1.01,0.040889599919319154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,16,4,power_law_1.2,0.03638400137424469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,16,4,power_law_1.01,0.040275201201438904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,16,4,power_law_1.2,0.03372800052165985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,16,4,power_law_1.01,0.041715198755264284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,16,4,power_law_1.2,0.04622080028057098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,16,4,power_law_1.01,0.042931199073791504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,16,4,power_law_1.2,0.052774399518966675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,16,4,power_law_1.01,0.0484607994556427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,16,4,power_law_1.2,0.07406719923019409
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,16,4,power_law_1.01,0.05030400156974792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,16,4,power_law_1.01,0.054816001653671266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,16,4,power_law_1.2,0.0830847978591919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,16,4,power_law_1.01,0.06177279949188232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,16,4,power_law_1.2,0.12650879621505737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,16,4,power_law_1.01,0.0695680022239685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,16,4,power_law_1.2,0.14330240488052368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,16,4,power_law_1.01,0.07735040187835693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,16,4,power_law_1.2,0.1908031940460205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,16,4,power_law_1.01,0.08963840007781983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,16,4,power_law_1.2,0.26698238849639894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,16,4,power_law_1.01,0.12649600505828856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,16,4,power_law_1.2,0.3804287910461426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,16,4,power_law_1.01,0.1275264024734497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,16,4,power_law_1.2,0.508454418182373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,16,4,power_law_1.01,0.19367040395736695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,16,4,power_law_1.2,0.627238416671753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,16,4,power_law_1.01,0.22807679176330567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,16,4,power_law_1.2,0.9817472457885742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,16,4,power_law_1.01,0.3145024061203003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,16,4,power_law_1.2,2.177568054199219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,16,4,power_law_1.01,0.43512959480285646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,16,4,power_law_1.01,0.545305585861206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,16,4,power_law_1.01,0.9571647644042969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,2,power_law_1.2,0.19527039527893067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,16,4,power_law_1.2,0.04170880019664765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,16,4,power_law_1.01,1.939993667602539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,2,power_law_1.2,0.20981760025024415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,16,4,power_law_1.2,0.037215998768806456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,16,4,power_law_1.2,0.03720960021018982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,2,power_law_1.2,0.21430399417877197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,16,4,power_law_1.2,0.03678080141544342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,2,power_law_1.2,0.23887999057769777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,16,4,power_law_1.2,0.03842560052871704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,16,4,power_law_1.2,0.03966720104217529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,2,power_law_1.2,0.26796159744262693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,8,8,power_law_1.01,0.019577600061893463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,16,4,power_law_1.2,0.038848000764846805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,8,8,power_law_1.01,0.018969599902629853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,2,power_law_1.2,0.2984895944595337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,16,4,power_law_1.2,0.03925760090351105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,8,8,power_law_1.01,0.019788800179958342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,2,power_law_1.2,0.35849599838256835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,16,4,power_law_1.2,0.03864319920539856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,8,8,power_law_1.01,0.019167999923229217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,16,4,power_law_1.2,0.04007680118083954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,8,8,power_law_1.01,0.020627200603485107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,2,power_law_1.2,0.4117311954498291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,8,8,power_law_1.2,0.03059200048446655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,8,8,power_law_1.01,0.022463999688625336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,16,4,power_law_1.2,0.040275201201438904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,2,power_law_1.2,0.5247935771942138
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,8,8,power_law_1.2,0.0398144006729126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,8,8,power_law_1.01,0.022035199403762817
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,16,4,power_law_1.2,0.04273920059204102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,8,8,power_law_1.2,0.040012800693511964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,8,8,power_law_1.01,0.023481599986553192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,16,4,power_law_1.2,0.043750399351119997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,2,power_law_1.2,0.6572735786437989
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,8,8,power_law_1.2,0.04556800127029419
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,8,8,power_law_1.01,0.024294400215148927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,16,4,power_law_1.2,0.04499199986457825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,2,power_law_1.2,0.8694592475891113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,8,8,power_law_1.01,0.02449920028448105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,8,8,power_law_1.2,0.05190399885177612
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,16,4,power_law_1.2,0.05194240212440491
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,8,8,power_law_1.01,0.02573440074920654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,8,8,power_law_1.2,0.07278720140457154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,16,4,power_law_1.2,0.05134080052375793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,2,power_law_1.2,1.10066556930542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,8,8,power_law_1.01,0.02983039915561676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,16,4,power_law_1.2,0.055430400371551516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,2,power_law_1.2,1.4867263793945313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,8,8,power_law_1.01,0.030444800853729248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,16,4,power_law_1.2,0.06240000128746033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,8,8,power_law_1.01,0.033523198962211606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,16,4,power_law_1.2,0.06505600214004517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,2,power_law_1.2,1.8123519897460938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,8,8,power_law_1.01,0.04270719885826111
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,16,4,power_law_1.2,0.08083840012550354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,8,8,power_law_1.01,0.03935999870300293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,16,4,power_law_1.2,0.09085440039634704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,2,power_law_1.2,2.238547134399414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,8,8,power_law_1.01,0.048870399594306946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,16,4,power_law_1.2,0.12199679613113404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,8,8,power_law_1.01,0.06176000237464905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,2,power_law_1.2,3.4954113006591796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,16,4,power_law_1.2,0.14494719505310058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,8,8,power_law_1.01,0.06320639848709106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,16,4,power_law_1.2,0.20371201038360595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,8,8,power_law_1.01,0.10744960308074951
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,16,4,power_law_1.2,0.2526592016220093
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,2,power_law_1.2,6.594847869873047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,8,8,power_law_1.01,0.12710399627685548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,16,4,power_law_1.2,0.3749183893203735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,8,8,power_law_1.01,0.18670079708099366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,16,4,power_law_1.2,0.43962879180908204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,8,8,power_law_1.01,0.22663679122924804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,16,4,power_law_1.2,0.5977344036102294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,8,8,power_law_1.01,0.322873592376709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,16,4,power_law_1.2,0.9936127662658691
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,8,8,power_law_1.2,0.0201664000749588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,8,8,power_law_1.01,0.43349761962890626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,16,4,power_law_1.2,1.9318016052246094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,8,8,power_law_1.2,0.02077440023422241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,8,8,power_law_1.01,0.6704319953918457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,8,8,power_law_1.2,0.02078080028295517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,8,8,power_law_1.01,0.8539327621459961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,8,8,power_law_1.2,0.02035840004682541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,8,8,power_law_1.01,1.0921216011047363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,8,8,power_law_1.2,0.021382400393486024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,8,8,power_law_1.01,0.04007039964199066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,8,8,power_law_1.01,1.5609024047851563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,8,8,power_law_1.2,0.023027199506759643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,8,8,power_law_1.01,0.04007680118083954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,8,8,power_law_1.01,3.3250686645507814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,8,8,power_law_1.2,0.022419199347496033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,8,8,power_law_1.01,0.04108799993991852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,8,8,power_law_1.2,0.02465279996395111
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,8,8,power_law_1.01,0.03885439932346344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,8,8,power_law_1.2,0.02508159875869751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,8,8,power_law_1.01,0.03844479918479919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,8,8,power_law_1.2,0.02507520020008087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,8,8,power_law_1.2,0.03966079950332642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,8,8,power_law_1.01,0.03948160111904144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,8,8,power_law_1.2,0.027353599667549133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,8,8,power_law_1.2,0.040275201201438904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,8,8,power_law_1.01,0.04007680118083954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,8,8,power_law_1.2,0.03080959916114807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,8,8,power_law_1.2,0.04170239865779877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,8,8,power_law_1.01,0.04087679982185364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,8,8,power_law_1.2,0.03162879943847656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,8,8,power_law_1.2,0.041503998637199405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,8,8,power_law_1.01,0.041094401478767396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,8,8,power_law_1.2,0.032652801275253295
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,8,8,power_law_1.2,0.03925760090351105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,8,8,power_law_1.01,0.04211840033531189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,8,8,power_law_1.2,0.04104959964752197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,8,8,power_law_1.2,0.0412992000579834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,8,8,power_law_1.01,0.04170880019664765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,8,8,power_law_1.2,0.046988800168037415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,8,8,power_law_1.2,0.040889599919319154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,8,8,power_law_1.01,0.042534399032592776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,8,8,power_law_1.2,0.04965119957923889
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,8,8,power_law_1.2,0.040889599919319154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,8,8,power_law_1.01,0.044172799587249754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,8,8,power_law_1.2,0.05620480179786682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,8,8,power_law_1.2,0.0412992000579834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,8,8,power_law_1.01,0.04497919976711273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,8,8,power_law_1.2,0.08056319952011108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,8,8,power_law_1.2,0.042310398817062375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,8,8,power_law_1.01,0.050310397148132326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,8,8,power_law_1.2,0.10167039632797241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,8,8,power_law_1.2,0.041280001401901245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,8,8,power_law_1.01,0.05175039768218994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,8,8,power_law_1.2,0.12789119482040406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,8,8,power_law_1.2,0.04376319944858551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,8,8,power_law_1.01,0.06178560256958008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,8,8,power_law_1.2,0.18481919765472413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,8,8,power_law_1.2,0.04395520091056824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,8,8,power_law_1.01,0.070387202501297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,8,8,power_law_1.2,0.23274240493774415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,8,8,power_law_1.2,0.0470335990190506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,8,8,power_law_1.01,0.07427840232849121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,8,8,power_law_1.2,0.32734720706939696
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,8,8,power_law_1.2,0.05235840082168579
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,8,8,power_law_1.01,0.08840960264205933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,8,8,power_law_1.2,0.4526847839355469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,8,8,power_law_1.2,0.05727360248565674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,8,8,power_law_1.01,0.10622080564498901
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,8,8,power_law_1.2,0.6630208015441894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,8,8,power_law_1.2,0.0605567991733551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,8,8,power_law_1.01,0.14041600227355958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,8,8,power_law_1.2,0.8391424179077148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,8,8,power_law_1.2,0.07160320281982421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,8,8,power_law_1.01,0.16254080533981324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,8,8,power_law_1.2,1.090022373199463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,8,8,power_law_1.2,0.07447680234909057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,8,8,power_law_1.01,0.23831679821014404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,8,8,power_law_1.2,1.691935920715332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,8,8,power_law_1.2,0.09003520011901855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,8,8,power_law_1.01,0.2845952033996582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,8,8,power_law_1.2,0.10990719795227051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,8,8,power_law_1.2,3.449932861328125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,8,8,power_law_1.01,0.41443839073181155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,8,8,power_law_1.2,0.1322175979614258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,8,8,power_law_1.01,0.5444992065429688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,8,8,power_law_1.2,0.16826879978179932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,8,8,power_law_1.01,0.6794559955596924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,8,8,power_law_1.2,0.24117119312286378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,8,8,power_law_1.2,0.2858367919921875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,8,8,power_law_1.01,1.0839424133300781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,16,4,power_law_1.01,0.019948799908161164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,8,8,power_law_1.2,0.4132095813751221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,8,8,power_law_1.01,2.3037248611450196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,16,4,power_law_1.01,0.019545599818229675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,8,8,power_law_1.2,0.5358848094940185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,16,4,power_law_1.01,0.01973759979009628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,8,8,power_law_1.2,0.7040256023406982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,16,4,power_law_1.01,0.019756799936294554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,8,8,power_law_1.2,1.1060416221618652
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,16,4,power_law_1.01,0.0201664000749588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,16,4,power_law_1.01,0.02220800071954727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,8,8,power_law_1.2,2.282009506225586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,16,4,power_law_1.2,0.01959040015935898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,16,4,power_law_1.01,0.02200320065021515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,16,4,power_law_1.2,0.019174399971961974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,16,4,power_law_1.01,0.022419199347496033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,16,4,power_law_1.2,0.018982400000095368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,16,4,power_law_1.01,0.024255999922752382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,16,4,power_law_1.01,0.04395520091056824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,16,4,power_law_1.2,0.01959040015935898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,16,4,power_law_1.01,0.02508159875869751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,16,4,power_law_1.01,0.04108799993991852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,16,4,power_law_1.01,0.025491198897361754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,16,4,power_law_1.2,0.020422400534152986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,16,4,power_law_1.01,0.039654400944709775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,16,4,power_law_1.01,0.029996800422668456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,16,4,power_law_1.2,0.02205439954996109
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,16,4,power_law_1.01,0.040275201201438904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,16,4,power_law_1.01,0.03080959916114807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,16,4,power_law_1.2,0.022873599827289582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,16,4,power_law_1.01,0.04110080003738403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,16,4,power_law_1.01,0.03162879943847656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,16,4,power_law_1.2,0.022867199778556824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,16,4,power_law_1.01,0.03244799971580505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,16,4,power_law_1.01,0.041503998637199405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,16,4,power_law_1.2,0.024716800451278685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,16,4,power_law_1.01,0.033888000249862674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,16,4,power_law_1.01,0.041715198755264284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,16,4,power_law_1.2,0.02512640058994293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,16,4,power_law_1.01,0.036134400963783266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,16,4,power_law_1.01,0.041503998637199405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,16,4,power_law_1.2,0.0253248006105423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,16,4,power_law_1.01,0.050457602739334105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,16,4,power_law_1.01,0.04211199879646301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,16,4,power_law_1.2,0.030239999294281006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,16,4,power_law_1.01,0.0603007972240448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,16,4,power_law_1.01,0.042310398817062375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,16,4,power_law_1.2,0.030656000971794127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,16,4,power_law_1.01,0.07381759881973267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,16,4,power_law_1.01,0.04211840033531189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,16,4,power_law_1.2,0.0310591995716095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,16,4,power_law_1.01,0.09386879801750184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,16,4,power_law_1.01,0.044377601146698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,16,4,power_law_1.2,0.033107200264930726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,16,4,power_law_1.01,0.12911360263824462
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,16,4,power_law_1.01,0.04456959962844849
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,16,4,power_law_1.2,0.0341376006603241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,16,4,power_law_1.01,0.15697280168533326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,16,4,power_law_1.01,0.04745599925518036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,16,4,power_law_1.2,0.046828800439834596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,16,4,power_law_1.01,0.05194240212440491
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,16,4,power_law_1.01,0.23438079357147218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,16,4,power_law_1.2,0.05440639853477478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,16,4,power_law_1.01,0.05502079725265503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,16,4,power_law_1.01,0.33330559730529785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,16,4,power_law_1.2,0.06567680239677429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,16,4,power_law_1.01,0.0630079984664917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,16,4,power_law_1.01,0.41747198104858396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,16,4,power_law_1.2,0.07939199805259704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,16,4,power_law_1.01,0.06709759831428527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,16,4,power_law_1.01,0.5432191848754883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,16,4,power_law_1.2,0.10908160209655762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,16,4,power_law_1.01,0.0775488018989563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,16,4,power_law_1.01,0.7600959777832031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,16,4,power_law_1.2,0.1410431981086731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,16,4,power_law_1.01,0.09311360120773315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,16,4,power_law_1.01,1.1227968215942383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,16,4,power_law_1.2,0.1881343960762024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,16,4,power_law_1.01,0.11071360111236572
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,16,4,power_law_1.2,0.2755903959274292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,16,4,power_law_1.01,2.143916893005371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,16,4,power_law_1.01,0.1572160005569458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,16,4,power_law_1.2,0.3775552034378052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,16,4,power_law_1.01,0.16396160125732423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,16,4,power_law_1.2,0.5669888019561767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,16,4,power_law_1.01,0.21332480907440185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,16,4,power_law_1.2,0.7396736145019531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,16,4,power_law_1.2,0.05047680139541626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,16,4,power_law_1.01,0.2735424041748047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,16,4,power_law_1.2,0.8084927558898926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,16,4,power_law_1.2,0.04352000057697296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,16,4,power_law_1.01,0.40728321075439455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,16,4,power_law_1.2,0.041043201088905336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,16,4,power_law_1.2,1.32107515335083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,16,4,power_law_1.01,0.5203135967254638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,16,4,power_law_1.2,0.04104959964752197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,16,4,power_law_1.01,0.717139196395874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,16,4,power_law_1.2,3.1176000595092774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,16,4,power_law_1.2,0.04289920032024384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,16,4,power_law_1.01,1.1154623985290528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,16,4,power_law_1.2,0.04392319917678833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,16,4,power_law_1.2,0.04227199852466583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,16,4,power_law_1.01,2.1812416076660157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,16,4,power_law_1.2,0.04349440038204193
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,32,2,power_law_1.01,0.018572799861431122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,16,4,power_law_1.2,0.042694398760795595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,32,2,power_law_1.01,0.018572799861431122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,16,4,power_law_1.2,0.043910399079322815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,32,2,power_law_1.01,0.019180800020694732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,32,2,power_law_1.2,0.018355199694633485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,16,4,power_law_1.2,0.043507200479507444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,32,2,power_law_1.01,0.019603200256824493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,32,2,power_law_1.2,0.018355199694633485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,16,4,power_law_1.2,0.04535680115222931
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,32,2,power_law_1.01,0.01959040015935898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,32,2,power_law_1.2,0.019180800020694732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,16,4,power_law_1.2,0.04555520117282867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,32,2,power_law_1.01,0.02143999934196472
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,32,2,power_law_1.2,0.019392000138759614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,16,4,power_law_1.2,0.0488319993019104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,32,2,power_law_1.01,0.022047999501228332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,32,2,power_law_1.2,0.01958400011062622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,16,4,power_law_1.2,0.05294079780578613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,32,2,power_law_1.2,0.020812800526618956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,16,4,power_law_1.2,0.05537279844284058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,32,2,power_law_1.01,0.021644799411296843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,32,2,power_law_1.2,0.02122880071401596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,16,4,power_law_1.2,0.06050559878349304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,32,2,power_law_1.01,0.023686400055885314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,16,4,power_law_1.2,0.07299839854240417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,32,2,power_law_1.2,0.022035199403762817
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,32,2,power_law_1.01,0.02391680032014847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,16,4,power_law_1.2,0.07751039862632751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,32,2,power_law_1.2,0.023680000007152556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,32,2,power_law_1.01,0.02492160052061081
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,16,4,power_law_1.2,0.08775039911270141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,32,2,power_law_1.2,0.02409600019454956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,32,2,power_law_1.01,0.029836800694465638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,16,4,power_law_1.2,0.11457279920578003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,32,2,power_law_1.2,0.024716800451278685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,32,2,power_law_1.01,0.030880001187324525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,16,4,power_law_1.2,0.16147840023040771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,32,2,power_law_1.2,0.029414400458335876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,32,2,power_law_1.01,0.03144960105419159
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,16,4,power_law_1.2,0.18440959453582764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,32,2,power_law_1.2,0.030643200874328612
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,32,2,power_law_1.01,0.03311359882354736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,32,2,power_law_1.2,0.03126400113105774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,16,4,power_law_1.2,0.2544447898864746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,32,2,power_law_1.01,0.03330560028553009
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,32,2,power_law_1.2,0.032492798566818235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,16,4,power_law_1.2,0.3457920074462891
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,32,2,power_law_1.01,0.0355648010969162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,32,2,power_law_1.2,0.03330560028553009
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,16,4,power_law_1.2,0.5039040088653565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,32,2,power_law_1.01,0.04026240110397339
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,32,2,power_law_1.2,0.035155200958251955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,32,2,power_law_1.01,0.052767997980117796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,16,4,power_law_1.2,0.6169343948364258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,32,2,power_law_1.2,0.04047360122203827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,32,2,power_law_1.01,0.06629120111465454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,16,4,power_law_1.2,0.7473983764648438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,32,2,power_law_1.2,0.055641597509384154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,32,2,power_law_1.01,0.07900159955024719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,16,4,power_law_1.2,1.1182975769042969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,32,2,power_law_1.2,0.07201279997825623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,32,2,power_law_1.01,0.11050239801406861
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,16,4,power_law_1.2,2.3579456329345705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,32,2,power_law_1.2,0.09188479781150818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,32,2,power_law_1.01,0.1359231948852539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,32,2,power_law_1.2,0.11460479497909545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,32,2,power_law_1.01,0.20657920837402344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,32,2,power_law_1.2,0.15905280113220216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,32,2,power_law_1.01,0.2723072052001953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,32,2,power_law_1.2,0.19939839839935303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,32,2,power_law_1.01,0.04126079976558685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,32,2,power_law_1.01,0.4023871898651123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,32,2,power_law_1.2,0.27068800926208497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,32,2,power_law_1.01,0.04104959964752197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,32,2,power_law_1.01,0.4773119926452637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,32,2,power_law_1.2,0.3474751949310303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,32,2,power_law_1.01,0.041465601325035094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,32,2,power_law_1.01,0.6593791961669921
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,32,2,power_law_1.01,0.04392319917678833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,32,2,power_law_1.2,0.497376012802124
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,32,2,power_law_1.01,0.917843246459961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,32,2,power_law_1.01,0.045151999592781066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,32,2,power_law_1.2,0.6454336166381835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,32,2,power_law_1.01,1.9113279342651368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,32,2,power_law_1.01,0.04514560103416443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,32,2,power_law_1.2,1.0235136032104493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,32,2,power_law_1.01,0.046163201332092285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,32,2,power_law_1.2,2.0427967071533204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,32,2,power_law_1.01,0.04555520117282867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,32,2,power_law_1.01,0.045542401075363156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,32,2,power_law_1.2,0.03966079950332642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,32,2,power_law_1.01,0.04597119987010956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,32,2,power_law_1.2,0.04004479944705963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,32,2,power_law_1.01,0.045952001214027406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,32,2,power_law_1.2,0.03966720104217529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,8,8,power_law_1.2,0.08855040073394775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,32,2,power_law_1.01,0.047603198885917665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,32,2,power_law_1.2,0.042931199073791504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,8,8,power_law_1.2,0.1188480019569397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,32,2,power_law_1.01,0.048019200563430786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,32,2,power_law_1.2,0.04333440065383911
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,8,8,power_law_1.2,0.15245440006256103
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,32,2,power_law_1.01,0.04902400076389313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,32,2,power_law_1.2,0.04355199933052063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,8,8,power_law_1.2,0.22330880165100098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,32,2,power_law_1.01,0.054553598165512085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,1,64,power_law_1.01,0.02858879864215851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,32,2,power_law_1.2,0.04519039988517761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,8,8,power_law_1.2,0.28330240249633787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,32,2,power_law_1.01,0.05699840188026428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,1,64,power_law_1.01,0.028198400139808656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,32,2,power_law_1.2,0.046623998880386354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,8,8,power_law_1.2,0.42729601860046384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,32,2,power_law_1.01,0.061952000856399535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,32,2,power_law_1.2,0.04704639911651611
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,1,64,power_law_1.01,0.027577599883079527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,32,2,power_law_1.01,0.07423359751701356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,8,8,power_law_1.2,0.4625088214874268
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,32,2,power_law_1.2,0.04785920083522797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,1,64,power_law_1.01,0.027161601185798644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,32,2,power_law_1.01,0.0787392020225525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,8,8,power_law_1.2,0.6593152046203613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,32,2,power_law_1.2,0.04622080028057098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,32,2,power_law_1.01,0.09921919703483581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,1,64,power_law_1.01,0.040064001083374025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,8,8,power_law_1.2,1.0629952430725098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,32,2,power_law_1.2,0.04723840057849884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,32,2,power_law_1.01,0.10863360166549682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,1,64,power_law_1.01,0.04170239865779877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,32,2,power_law_1.2,0.04723840057849884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,32,2,power_law_1.01,0.1383296012878418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,32,2,power_law_1.2,0.04990079998970032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,1,64,power_law_1.01,0.04580479860305786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,32,2,power_law_1.01,0.18275840282440187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,32,2,power_law_1.2,0.05624960064888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,32,2,power_law_1.01,0.236844801902771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,1,64,power_law_1.01,0.04867840111255646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,32,2,power_law_1.2,0.05809280276298523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,32,2,power_law_1.01,0.31055359840393065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,1,64,power_law_1.01,0.05071359872817993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,32,2,power_law_1.2,0.06178560256958008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,32,2,power_law_1.01,0.43140478134155275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,1,64,power_law_1.01,0.06074240207672119
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,32,2,power_law_1.2,0.07489280104637146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,32,2,power_law_1.01,0.6087488174438477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,32,2,power_law_1.2,0.07487360239028931
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,1,64,power_law_1.01,0.06895359754562377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,32,2,power_law_1.01,0.6695680141448974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,32,2,power_law_1.2,0.09455360174179077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,1,64,power_law_1.01,0.070387202501297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,32,2,power_law_1.01,1.032902431488037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,32,2,power_law_1.2,0.11255680322647095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,1,64,power_law_1.01,0.08799999952316284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,32,2,power_law_1.01,2.1672576904296874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,32,2,power_law_1.2,0.15394560098648072
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,32,2,power_law_1.2,0.16172159910202027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,1,64,power_law_1.01,0.10929919481277466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,32,2,power_law_1.2,0.24056320190429686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,1,64,power_law_1.01,0.07979519963264466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,32,2,power_law_1.2,0.27149438858032227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,1,64,power_law_1.01,0.09004160165786743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,32,2,power_law_1.2,0.42203521728515625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,1,64,power_law_1.01,0.11317119598388672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,1,64,power_law_1.2,0.021804800629615782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,32,2,power_law_1.2,0.5367104053497315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,32,2,power_law_1.2,0.690937614440918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,1,64,power_law_1.01,0.10069119930267334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,1,64,power_law_1.2,0.021798400580883025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,32,2,power_law_1.2,1.238758373260498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,1,64,power_law_1.2,0.021798400580883025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,1,64,power_law_1.01,0.12403199672698975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,1,64,power_law_1.2,0.021593600511550903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,1,64,power_law_1.01,0.17768319845199584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,32,2,power_law_1.2,2.190675163269043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,1,64,power_law_1.2,0.023417599499225616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,1,64,power_law_1.01,0.22479360103607177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,1,64,power_law_1.2,0.0271232008934021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,1,64,power_law_1.01,0.337606406211853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,1,64,power_law_1.01,0.08635519742965699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,1,64,power_law_1.2,0.0332863986492157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,1,64,power_law_1.01,0.4310336112976074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,1,64,power_law_1.01,0.08880640268325805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,1,64,power_law_1.2,0.03511680066585541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,1,64,power_law_1.01,0.6491456031799316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,1,64,power_law_1.2,0.041875201463699344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,1,64,power_law_1.01,0.8707455635070801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,1,64,power_law_1.2,0.04392319917678833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,1,64,power_law_1.01,1.3911359786987305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,1,64,power_law_1.2,0.05088000297546387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,1,64,power_law_1.01,1.5207743644714355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,1,64,power_law_1.2,0.05927680134773254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,1,64,power_law_1.01,2.0411584854125975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,1,64,power_law_1.2,0.06682239770889283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,1,64,power_law_1.2,0.08241919875144958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,1,64,power_law_1.01,3.3201534271240236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,1,64,power_law_1.2,0.06276479959487916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,1,64,power_law_1.01,6.755872344970703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,1,64,power_law_1.2,0.07136639952659607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,1,64,power_law_1.2,0.08754559755325317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,1,64,power_law_1.2,0.07752320170402527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,1,64,power_law_1.2,0.08881279826164246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,1,64,power_law_1.2,0.09589759707450866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,1,64,power_law_1.2,0.06792320013046264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,1,64,power_law_1.2,0.13395839929580688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,1,64,power_law_1.2,0.06464639902114869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,1,64,power_law_1.2,0.15942399501800536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,1,64,power_law_1.2,0.060134398937225345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,1,64,power_law_1.2,0.23315200805664063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,1,64,power_law_1.2,0.06546559929847717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,1,64,power_law_1.2,0.3007359981536865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,1,64,power_law_1.2,0.06587520241737366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,1,64,power_law_1.2,0.4416384220123291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,1,64,power_law_1.2,0.06709759831428527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,1,64,power_law_1.2,0.5824704170227051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,1,64,power_law_1.2,0.07099519968032837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,1,64,power_law_1.2,0.8620223999023438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,1,64,power_law_1.2,0.06915199756622314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,1,64,power_law_1.2,1.1449151992797852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,1,64,power_law_1.2,0.07160959839820862
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,1,64,power_law_1.2,1.4230463981628418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,1,64,power_law_1.2,0.07159680128097534
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,1,64,power_law_1.2,2.25863037109375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,1,64,power_law_1.2,0.07509120106697083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,1,64,power_law_1.2,0.07365120053291321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,1,64,power_law_1.2,4.4184318542480465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,1,64,power_law_1.2,0.07774080038070678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,1,64,power_law_1.2,0.08881279826164246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,1,64,power_law_1.2,0.09556480050086975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,1,64,power_law_1.2,0.09946879744529724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,2,32,power_law_1.01,0.021388800442218782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,1,64,power_law_1.2,0.11051520109176635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,2,32,power_law_1.01,0.021382400393486024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,1,64,power_law_1.2,0.12342400550842285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,2,32,power_law_1.01,0.021593600511550903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,1,64,power_law_1.2,0.1465664029121399
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,2,32,power_law_1.01,0.021388800442218782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,1,64,power_law_1.2,0.15762560367584227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,2,32,power_law_1.01,0.024672000110149382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,1,64,power_law_1.2,0.20227200984954835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,2,32,power_law_1.01,0.025286400318145753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,1,64,power_law_1.2,0.25982720851898194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,2,32,power_law_1.01,0.028563201427459717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,1,64,power_law_1.2,0.32739839553833006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,2,32,power_law_1.01,0.03429119884967804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,1,64,power_law_1.2,0.4074944019317627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,2,32,power_law_1.01,0.03798399865627289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,1,64,power_law_1.2,0.6067584037780762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,2,32,power_law_1.01,0.04063999950885773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,1,64,power_law_1.2,0.7560448169708252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,2,32,power_law_1.01,0.0463808000087738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,1,64,power_law_1.2,0.9837823867797851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,2,32,power_law_1.01,0.05371519923210144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,2,32,power_law_1.01,0.060710400342941284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,1,64,power_law_1.2,1.7476224899291992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,2,32,power_law_1.01,0.07383679747581481
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,1,64,power_law_1.2,3.572652816772461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,2,32,power_law_1.01,0.056415998935699464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,2,32,power_law_1.01,0.06316800117492676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,2,32,power_law_1.01,0.07832319736480713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,2,32,power_law_1.01,0.06849920153617858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,2,32,power_law_1.01,0.08441600203514099
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,2,32,power_law_1.01,0.09880959987640381
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,2,32,power_law_1.01,0.12338559627532959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,2,32,power_law_1.01,0.17437440156936646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,2,32,power_law_1.2,0.0324864000082016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,2,32,power_law_1.01,0.22167680263519288
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,2,32,power_law_1.2,0.031052801012992858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,2,32,power_law_1.01,0.3230655908584595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,2,32,power_law_1.2,0.024915200471878052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,2,32,power_law_1.01,0.42237439155578616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,2,32,power_law_1.2,0.0253248006105423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,2,32,power_law_1.2,0.03221119940280914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,2,32,power_law_1.01,0.6218688011169433
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,2,32,power_law_1.2,0.037215998768806456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,2,32,power_law_1.01,0.8202879905700684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,2,32,power_law_1.2,0.04519039988517761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,2,32,power_law_1.01,1.0185536384582519
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,2,32,power_law_1.2,0.04989440143108368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,2,32,power_law_1.01,1.6104320526123046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,2,32,power_law_1.2,0.049292799830436704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,2,32,power_law_1.2,0.05516160130500793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,2,32,power_law_1.01,3.2017215728759765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,2,32,power_law_1.2,0.0630079984664917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,2,32,power_law_1.2,0.07611520290374756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,2,32,power_law_1.2,0.08572800159454345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,2,32,power_law_1.01,0.0807807981967926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,2,32,power_law_1.2,0.10437120199203491
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,2,32,power_law_1.01,0.07177600264549255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,2,32,power_law_1.2,0.08021119832992554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,2,32,power_law_1.01,0.06788480281829834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,2,32,power_law_1.2,0.09229440093040467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,2,32,power_law_1.01,0.061945599317550656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,2,32,power_law_1.2,0.11298559904098511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,2,32,power_law_1.01,0.06399359703063964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,2,32,power_law_1.2,0.09945600032806397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,2,32,power_law_1.01,0.06849920153617858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,2,32,power_law_1.2,0.1268671989440918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,2,32,power_law_1.01,0.07320320010185241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,2,32,power_law_1.01,0.07112320065498352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,2,32,power_law_1.2,0.1643839955329895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,2,32,power_law_1.01,0.07505279779434204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,2,32,power_law_1.2,0.20923519134521484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,2,32,power_law_1.01,0.07504640221595764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,2,32,power_law_1.2,0.29034240245819093
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,2,32,power_law_1.01,0.0744383990764618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,2,32,power_law_1.2,0.3800384044647217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,2,32,power_law_1.01,0.077920001745224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,2,32,power_law_1.2,0.5698944091796875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,2,32,power_law_1.01,0.08078719973564148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,2,32,power_law_1.2,0.7654784202575684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,2,32,power_law_1.01,0.08222079873085023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,2,32,power_law_1.2,1.0696000099182128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,2,32,power_law_1.01,0.09102079868316651
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,2,32,power_law_1.2,1.5248640060424805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,2,32,power_law_1.01,0.09122560024261475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,2,32,power_law_1.2,1.9170368194580079
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,2,32,power_law_1.01,0.0996288001537323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,2,32,power_law_1.01,0.11478400230407715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,2,32,power_law_1.2,3.1701568603515624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,2,32,power_law_1.01,0.12541439533233642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,2,32,power_law_1.2,6.766099548339843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,2,32,power_law_1.01,0.15164799690246583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,2,32,power_law_1.01,0.16024960279464723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,2,32,power_law_1.01,0.19586559534072875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,2,32,power_law_1.01,0.23519999980926515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,2,32,power_law_1.2,0.07774720191955567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,8,8,power_law_1.2,2.1803775787353517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,2,32,power_law_1.2,0.07342720031738281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,2,32,power_law_1.01,0.29703679084777834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,2,32,power_law_1.2,0.0630016028881073
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,2,32,power_law_1.01,0.381606388092041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,2,32,power_law_1.2,0.06094719767570496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,2,32,power_law_1.01,0.5189824104309082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,2,32,power_law_1.2,0.06381440162658691
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,2,32,power_law_1.01,0.6888192176818848
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,4,16,power_law_1.01,0.022809599339962006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,2,32,power_law_1.2,0.06750720143318176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,2,32,power_law_1.01,0.8071935653686524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,4,16,power_law_1.01,0.027935999631881713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,2,32,power_law_1.2,0.07160320281982421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,4,16,power_law_1.01,0.022201600670814513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,2,32,power_law_1.01,1.300147247314453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,2,32,power_law_1.2,0.07017599940299987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,4,16,power_law_1.01,0.02343679964542389
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,2,32,power_law_1.2,0.07447680234909057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,2,32,power_law_1.01,2.4792448043823243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,4,16,power_law_1.01,0.026707199215888978
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,2,32,power_law_1.2,0.07405440211296081
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,4,16,power_law_1.01,0.029971200227737426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,2,32,power_law_1.2,0.07604479789733887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,2,32,power_law_1.2,0.08102399706840516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,4,16,power_law_1.01,0.03919360041618347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,4,16,power_law_1.2,0.021190400421619415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,2,32,power_law_1.2,0.07796480059623719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,4,16,power_law_1.01,0.039603200554847715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,4,16,power_law_1.2,0.021388800442218782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,2,32,power_law_1.2,0.08019840121269226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,4,16,power_law_1.01,0.045542401075363156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,4,16,power_law_1.2,0.021388800442218782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,2,32,power_law_1.2,0.08798720240592957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,4,16,power_law_1.01,0.04759680032730103
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,4,16,power_law_1.2,0.02218240052461624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,2,32,power_law_1.2,0.09168000221252441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,4,16,power_law_1.01,0.057843202352523805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,4,16,power_law_1.2,0.02426239997148514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,2,32,power_law_1.2,0.1043776035308838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,4,16,power_law_1.01,0.05907840132713318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,4,16,power_law_1.2,0.02712959945201874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,2,32,power_law_1.2,0.11255040168762206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,4,16,power_law_1.01,0.06499840021133423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,4,16,power_law_1.2,0.02917119860649109
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,2,32,power_law_1.2,0.1273151993751526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,4,16,power_law_1.01,0.07627519965171814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,4,16,power_law_1.2,0.033478400111198424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,2,32,power_law_1.2,0.15066879987716675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,4,16,power_law_1.01,0.06110720038414001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,4,16,power_law_1.2,0.040428799390792844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,2,32,power_law_1.2,0.15843839645385743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,4,16,power_law_1.01,0.07237759828567505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,1,64,power_law_1.01,0.06465280055999756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,4,16,power_law_1.2,0.04289279878139496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,2,32,power_law_1.2,0.20760319232940674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,1,64,power_law_1.01,0.060153597593307497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,4,16,power_law_1.01,0.08324480056762695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,4,16,power_law_1.2,0.049856001138687135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,2,32,power_law_1.2,0.24774401187896727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,1,64,power_law_1.01,0.06301440000534057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,4,16,power_law_1.01,0.07912960052490234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,4,16,power_law_1.2,0.05416319966316223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,1,64,power_law_1.01,0.0654591977596283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,2,32,power_law_1.2,0.34603519439697267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,4,16,power_law_1.01,0.0965503990650177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,4,16,power_law_1.2,0.058271998167037965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,1,64,power_law_1.01,0.06791679859161377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,4,16,power_law_1.01,0.11579519510269165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,2,32,power_law_1.2,0.4226367950439453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,4,16,power_law_1.2,0.07054719924926758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,1,64,power_law_1.01,0.07059839963912964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,4,16,power_law_1.01,0.1393407940864563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,2,32,power_law_1.2,0.5596415996551514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,4,16,power_law_1.2,0.05743359923362732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,1,64,power_law_1.01,0.06956160068511963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,4,16,power_law_1.01,0.1774399995803833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,2,32,power_law_1.2,0.7757120132446289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,4,16,power_law_1.2,0.061939197778701785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,1,64,power_law_1.01,0.07181439995765686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,4,16,power_law_1.01,0.23968639373779296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,2,32,power_law_1.2,0.9420160293579102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,4,16,power_law_1.2,0.07646719813346863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,1,64,power_law_1.01,0.07079039812088013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,4,16,power_law_1.01,0.3601279973983765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,2,32,power_law_1.2,1.543295955657959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,4,16,power_law_1.2,0.06974080204963684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,1,64,power_law_1.01,0.07651839852333069
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,4,16,power_law_1.01,0.47071361541748047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,4,16,power_law_1.2,0.08631680011749268
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,1,64,power_law_1.01,0.07486720085144043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,2,32,power_law_1.2,3.068032073974609
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,4,16,power_law_1.01,0.644985580444336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,4,16,power_law_1.2,0.10495359897613525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,1,64,power_law_1.01,0.07817599773406983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,4,16,power_law_1.01,0.8866559982299804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,4,16,power_law_1.2,0.13155839443206788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,1,64,power_law_1.01,0.0834879994392395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,4,16,power_law_1.2,0.18687360286712645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,4,16,power_law_1.01,1.1252415657043457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,1,64,power_law_1.01,0.08839679956436157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,4,16,power_law_1.01,0.0744704008102417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,4,16,power_law_1.2,0.22863359451293946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,1,64,power_law_1.01,0.10028799772262573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,4,16,power_law_1.01,0.08554880023002624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,4,16,power_law_1.01,1.799238395690918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,4,16,power_law_1.2,0.3355520009994507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,1,64,power_law_1.01,0.10764800310134888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,4,16,power_law_1.01,0.0658623993396759
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,4,16,power_law_1.01,3.5044097900390625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,1,64,power_law_1.01,0.11993600130081176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,4,16,power_law_1.01,0.0654528021812439
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,4,16,power_law_1.2,0.435481595993042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,1,64,power_law_1.01,0.14083199501037597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,4,16,power_law_1.01,0.06792320013046264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,4,16,power_law_1.2,0.6404736042022705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,1,64,power_law_1.01,0.15312000513076782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,4,16,power_law_1.01,0.07488639950752259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,4,16,power_law_1.2,0.845088005065918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,4,16,power_law_1.2,0.07195519804954528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,1,64,power_law_1.01,0.19900159835815429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,4,16,power_law_1.01,0.07711359858512878
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,4,16,power_law_1.2,1.0509119987487794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,4,16,power_law_1.2,0.08856959939002991
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,4,16,power_law_1.01,0.08021119832992554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,1,64,power_law_1.01,0.22766718864440919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,4,16,power_law_1.2,1.6644863128662108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,4,16,power_law_1.2,0.060703998804092406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,4,16,power_law_1.01,0.08103039860725403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,1,64,power_law_1.01,0.30058879852294923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,4,16,power_law_1.2,0.06478719711303711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,4,16,power_law_1.01,0.08409600257873535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,1,64,power_law_1.01,0.36161279678344727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,4,16,power_law_1.2,3.3012542724609375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,4,16,power_law_1.2,0.06887680292129517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,4,16,power_law_1.01,0.08409600257873535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,1,64,power_law_1.01,0.5059904098510742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,4,16,power_law_1.2,0.07257599830627441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,4,16,power_law_1.01,0.08798080086708068
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,1,64,power_law_1.01,0.7105792045593262
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,8,8,power_law_1.01,0.02139520049095154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,4,16,power_law_1.2,0.07749760150909424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,4,16,power_law_1.01,0.0875711977481842
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,1,64,power_law_1.01,0.8445311546325683
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,8,8,power_law_1.01,0.021382400393486024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,4,16,power_law_1.2,0.07912960052490234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,4,16,power_law_1.01,0.08922240138053894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,8,8,power_law_1.01,0.023027199506759643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,1,64,power_law_1.01,1.2518719673156737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,4,16,power_law_1.2,0.08077440261840821
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,4,16,power_law_1.01,0.09679359793663025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,8,8,power_law_1.01,0.02322559952735901
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,4,16,power_law_1.2,0.08220800161361694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,4,16,power_law_1.01,0.09864959716796876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,1,64,power_law_1.01,2.555423927307129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,8,8,power_law_1.01,0.02508159875869751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,4,16,power_law_1.2,0.08426880240440368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,4,16,power_law_1.01,0.10723199844360351
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,8,8,power_law_1.01,0.028352001309394838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,4,16,power_law_1.2,0.08528640270233154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,4,16,power_law_1.01,0.11543680429458618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,8,8,power_law_1.01,0.031219199299812317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,4,16,power_law_1.2,0.08751999735832214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,4,16,power_law_1.01,0.1322175979614258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,8,8,power_law_1.2,0.022047999501228332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,8,8,power_law_1.01,0.03491199910640717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,4,16,power_law_1.2,0.09059839844703674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,4,16,power_law_1.01,0.15454720258712767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,8,8,power_law_1.2,0.024307200312614442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,8,8,power_law_1.01,0.04351359903812409
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,4,16,power_law_1.2,0.09572479724884034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,4,16,power_law_1.01,0.17133439779281617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,8,8,power_law_1.2,0.022873599827289582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,8,8,power_law_1.01,0.04596480131149292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,4,16,power_law_1.2,0.10001280307769775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,8,8,power_law_1.2,0.02449920028448105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,4,16,power_law_1.01,0.21518080234527587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,8,8,power_law_1.01,0.05127679705619812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,4,16,power_law_1.2,0.10739840269088745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,8,8,power_law_1.2,0.02861439883708954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,4,16,power_law_1.01,0.2430272102355957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,8,8,power_law_1.01,0.061945599317550656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,4,16,power_law_1.2,0.12951040267944336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,8,8,power_law_1.2,0.031052801012992858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,4,16,power_law_1.01,0.32351999282836913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,8,8,power_law_1.01,0.06706560254096985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,4,16,power_law_1.2,0.14057600498199463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,8,8,power_law_1.2,0.03578239977359772
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,4,16,power_law_1.01,0.40993919372558596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,8,8,power_law_1.01,0.08241919875144958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,4,16,power_law_1.2,0.16167680025100709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,8,8,power_law_1.2,0.038848000764846805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,4,16,power_law_1.01,0.5657792091369629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,8,8,power_law_1.01,0.06645119786262513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,8,8,power_law_1.2,0.047865599393844604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,4,16,power_law_1.2,0.18050559759140014
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,4,16,power_law_1.01,0.6937920093536377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,8,8,power_law_1.01,0.07175679802894593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,8,8,power_law_1.2,0.050323200225830075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,4,16,power_law_1.2,0.22597761154174806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,4,16,power_law_1.01,0.8789312362670898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,8,8,power_law_1.01,0.09041280150413514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,8,8,power_law_1.2,0.055027198791503903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,4,16,power_law_1.2,0.259769606590271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,4,16,power_law_1.01,1.3829504013061524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,8,8,power_law_1.01,0.08611199855804444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,8,8,power_law_1.2,0.06157439947128296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,4,16,power_law_1.2,0.33780479431152344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,8,8,power_law_1.2,0.07181439995765686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,8,8,power_law_1.01,0.10820480585098266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,4,16,power_law_1.01,2.7514047622680664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,4,16,power_law_1.2,0.426259183883667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,8,8,power_law_1.2,0.08532480001449586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,8,8,power_law_1.01,0.11763199567794799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,4,16,power_law_1.2,0.652780818939209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,8,8,power_law_1.2,0.07079039812088013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,8,8,power_law_1.01,0.14713599681854247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,4,16,power_law_1.2,0.8354496002197266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,8,8,power_law_1.2,0.07797120213508606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,8,8,power_law_1.01,0.20876801013946533
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,8,8,power_law_1.01,0.07774080038070678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,4,16,power_law_1.2,1.007084846496582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,8,8,power_law_1.2,0.09415040016174317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,8,8,power_law_1.01,0.25832960605621336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,8,8,power_law_1.01,0.08206080198287964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,4,16,power_law_1.2,1.6222976684570312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,8,8,power_law_1.2,0.0902463972568512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,8,8,power_law_1.01,0.38020479679107666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,8,8,power_law_1.01,0.0654591977596283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,8,8,power_law_1.2,0.11011199951171875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,8,8,power_law_1.01,0.06710399985313416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,8,8,power_law_1.01,0.4883264064788818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,4,16,power_law_1.2,3.097875213623047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,8,8,power_law_1.2,0.11790720224380494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,8,8,power_law_1.01,0.07200639843940734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,8,8,power_law_1.01,0.7186944007873535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,8,8,power_law_1.2,0.14615039825439452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,8,8,power_law_1.01,0.08039680123329163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,8,8,power_law_1.01,0.9476287841796875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,8,8,power_law_1.2,0.19467519521713256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,8,8,power_law_1.01,0.08839679956436157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,8,8,power_law_1.2,0.07175679802894593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,8,8,power_law_1.01,1.1789055824279786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,8,8,power_law_1.01,0.09249280095100403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,8,8,power_law_1.2,0.24732799530029298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,8,8,power_law_1.2,0.08240000009536744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,8,8,power_law_1.01,1.8701120376586915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,8,8,power_law_1.01,0.09575039744377137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,8,8,power_law_1.2,0.3468480110168457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,8,8,power_law_1.2,0.06398079991340637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,8,8,power_law_1.01,0.09781119823455811
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,8,8,power_law_1.2,0.4416831970214844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,8,8,power_law_1.01,3.7073665618896485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,8,8,power_law_1.2,0.06643840074539184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,8,8,power_law_1.01,0.0992576003074646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,8,8,power_law_1.2,0.0738048017024994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,8,8,power_law_1.2,0.6491456031799316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,8,8,power_law_1.01,0.10254080295562744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,8,8,power_law_1.2,0.07914239764213563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,8,8,power_law_1.2,0.8515007972717286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,16,4,power_law_1.01,0.021996800601482392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,8,8,power_law_1.01,0.10601600408554077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,8,8,power_law_1.2,0.08589439988136291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,8,8,power_law_1.2,1.0782143592834472
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,16,4,power_law_1.01,0.02220800071954727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,8,8,power_law_1.01,0.10641920566558838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,8,8,power_law_1.2,0.09285119771957398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,8,8,power_law_1.2,1.6821504592895509
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,16,4,power_law_1.01,0.02343679964542389
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,8,8,power_law_1.01,0.11112960577011108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,8,8,power_law_1.2,0.09100800156593322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,16,4,power_law_1.01,0.02650879919528961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,8,8,power_law_1.01,0.11338239908218384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,8,8,power_law_1.2,0.09530879855155945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,8,8,power_law_1.2,3.4315521240234377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,16,4,power_law_1.01,0.028352001309394838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,8,8,power_law_1.01,0.13038079738616942
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,8,8,power_law_1.2,0.10083839893341065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,16,4,power_law_1.01,0.03244799971580505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,8,8,power_law_1.01,0.1404096007347107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,8,8,power_law_1.2,0.1033087968826294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,16,4,power_law_1.01,0.036134400963783266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,16,4,power_law_1.2,0.0212351992726326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,8,8,power_law_1.01,0.15843839645385743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,8,8,power_law_1.2,0.10043519735336304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,16,4,power_law_1.01,0.03962239921092987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,16,4,power_law_1.2,0.022867199778556824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,8,8,power_law_1.01,0.18506239652633666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,8,8,power_law_1.2,0.10739840269088745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,16,4,power_law_1.01,0.04371840059757233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,16,4,power_law_1.2,0.023071999847888946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,8,8,power_law_1.01,0.20471680164337158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,8,8,power_law_1.2,0.11354240179061889
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,16,4,power_law_1.01,0.05231999754905701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,16,4,power_law_1.2,0.027372801303863527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,8,8,power_law_1.01,0.2550784111022949
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,8,8,power_law_1.2,0.11967999935150146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,16,4,power_law_1.01,0.05846400260925293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,16,4,power_law_1.2,0.030854400992393494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,8,8,power_law_1.01,0.29894399642944336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,8,8,power_law_1.2,0.13422080278396606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,16,4,power_law_1.01,0.06603519916534424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,16,4,power_law_1.2,0.0343423992395401
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,8,8,power_law_1.01,0.3777856111526489
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,8,8,power_law_1.2,0.1503872036933899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,16,4,power_law_1.01,0.07648000121116638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,16,4,power_law_1.2,0.03966079950332642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,8,8,power_law_1.2,0.16760319471359253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,8,8,power_law_1.01,0.47813119888305666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,16,4,power_law_1.01,0.09205120205879211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,16,4,power_law_1.2,0.0427264004945755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,8,8,power_law_1.2,0.1966976046562195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,8,8,power_law_1.01,0.6798719882965087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,16,4,power_law_1.01,0.07196159958839417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,16,4,power_law_1.2,0.046214398741722104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,8,8,power_law_1.2,0.20611200332641602
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,8,8,power_law_1.01,0.8301823616027832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,16,4,power_law_1.01,0.08549119830131531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,16,4,power_law_1.2,0.05112959742546082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,8,8,power_law_1.2,0.262227201461792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,8,8,power_law_1.01,1.0365951538085938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,16,4,power_law_1.01,0.10557440519332886
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,16,4,power_law_1.2,0.060550397634506224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,8,8,power_law_1.2,0.3081023931503296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,8,8,power_law_1.01,1.5830143928527831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,16,4,power_law_1.01,0.10576640367507935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,16,4,power_law_1.2,0.0664896011352539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,8,8,power_law_1.2,0.4178624153137207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,8,8,power_law_1.01,3.039366340637207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,16,4,power_law_1.01,0.13033599853515626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,16,4,power_law_1.2,0.07198079824447631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,8,8,power_law_1.2,0.4944767951965332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,16,4,power_law_1.2,0.08880640268325805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,16,4,power_law_1.01,0.14304640293121337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,8,8,power_law_1.2,0.7367487907409668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,16,4,power_law_1.2,0.07468799948692321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,16,4,power_law_1.01,0.17909120321273803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,8,8,power_law_1.2,0.9431872367858887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,16,4,power_law_1.2,0.08186240196228027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,16,4,power_law_1.01,0.24583680629730226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,8,8,power_law_1.2,1.1285375595092773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,16,4,power_law_1.01,0.07898240089416504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,16,4,power_law_1.2,0.09843840003013611
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,16,4,power_law_1.01,0.3126015901565552
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,8,8,power_law_1.2,1.7902463912963866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,16,4,power_law_1.01,0.08349440097808838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,16,4,power_law_1.2,0.09701759815216064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,16,4,power_law_1.01,0.45557122230529784
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,16,4,power_law_1.01,0.07119359970092773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,16,4,power_law_1.2,0.11665920019149781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,16,4,power_law_1.01,0.6120192050933838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,8,8,power_law_1.2,3.9926528930664062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,16,4,power_law_1.01,0.0756928026676178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,16,4,power_law_1.2,0.1252671957015991
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,16,4,power_law_1.01,0.8981247901916504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,16,4,power_law_1.01,0.08615040183067321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,16,4,power_law_1.2,0.15456000566482545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,16,4,power_law_1.01,1.1957056045532226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,16,4,power_law_1.01,0.09801599979400635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,16,4,power_law_1.2,0.2051392078399658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,16,4,power_law_1.01,1.4913151741027832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,16,4,power_law_1.01,0.11502079963684082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,16,4,power_law_1.2,0.2485503911972046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,16,4,power_law_1.2,0.07626240253448487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,16,4,power_law_1.01,0.11891839504241944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,16,4,power_law_1.01,2.3243263244628904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,16,4,power_law_1.2,0.35382399559020994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,16,4,power_law_1.2,0.08569599986076355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,16,4,power_law_1.01,0.12280960083007812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,16,4,power_law_1.2,0.06970880031585694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,16,4,power_law_1.2,0.46871042251586914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,16,4,power_law_1.01,4.6222270965576175
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,16,4,power_law_1.01,0.12280319929122925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,16,4,power_law_1.2,0.07504640221595764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,16,4,power_law_1.2,0.6417727947235108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,16,4,power_law_1.01,0.12566399574279785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,16,4,power_law_1.2,0.08485760092735291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,16,4,power_law_1.2,0.8396096229553223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,16,4,power_law_1.01,0.13182079792022705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,16,4,power_law_1.2,0.09736319780349731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,1,64,power_law_1.01,0.02038400024175644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,16,4,power_law_1.2,1.0753279685974122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,16,4,power_law_1.01,0.13857920169830323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,16,4,power_law_1.2,0.11538560390472412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,1,64,power_law_1.01,0.020153599977493285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,16,4,power_law_1.01,0.139193594455719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,16,4,power_law_1.2,1.701817512512207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,16,4,power_law_1.2,0.11804800033569336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,1,64,power_law_1.01,0.020153599977493285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,16,4,power_law_1.01,0.15127040147781373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,1,64,power_law_1.01,0.01995519995689392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,16,4,power_law_1.2,0.1223423957824707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,16,4,power_law_1.2,3.258707046508789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,16,4,power_law_1.01,0.15576959848403932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,1,64,power_law_1.01,0.021587200462818146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,16,4,power_law_1.2,0.12399359941482543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,16,4,power_law_1.01,0.1703104019165039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,1,64,power_law_1.01,0.025696000456809996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,16,4,power_law_1.2,0.12848639488220215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,1,64,power_law_1.01,0.02733440101146698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,16,4,power_law_1.01,0.18179839849472046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,16,4,power_law_1.2,0.13381119966506957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,1,64,power_law_1.2,0.019180800020694732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,1,64,power_law_1.01,0.02794879972934723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,16,4,power_law_1.01,0.2120896100997925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,16,4,power_law_1.2,0.1389248013496399
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,1,64,power_law_1.2,0.019193600118160247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,1,64,power_law_1.01,0.030796799063682555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,16,4,power_law_1.01,0.25265278816223147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,1,64,power_law_1.2,0.019180800020694732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,16,4,power_law_1.2,0.14670079946517944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,1,64,power_law_1.01,0.03203839957714081
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,16,4,power_law_1.01,0.2764159917831421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,1,64,power_law_1.2,0.019180800020694732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,16,4,power_law_1.2,0.15286400318145751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,1,64,power_law_1.01,0.03733760118484497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,1,64,power_law_1.2,0.020627200603485107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,16,4,power_law_1.01,0.34070401191711425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,16,4,power_law_1.2,0.1565440058708191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,1,64,power_law_1.01,0.03162879943847656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,1,64,power_law_1.2,0.024928000569343568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,16,4,power_law_1.01,0.40073599815368655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,1,64,power_law_1.01,0.033267199993133545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,16,4,power_law_1.2,0.17006720304489137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,1,64,power_law_1.2,0.026348799467086792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,1,64,power_law_1.01,0.03777920007705689
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,16,4,power_law_1.01,0.5252352237701416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,16,4,power_law_1.2,0.19218560457229614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,1,64,power_law_1.2,0.026976001262664796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,1,64,power_law_1.01,0.03450239896774292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,16,4,power_law_1.01,0.6396992206573486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,16,4,power_law_1.2,0.21225600242614745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,1,64,power_law_1.2,0.029625600576400755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,1,64,power_law_1.01,0.03736959993839264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,16,4,power_law_1.2,0.2542399883270264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,16,4,power_law_1.01,0.9698559761047363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,1,64,power_law_1.2,0.031673601269721983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,1,64,power_law_1.01,0.04514560103416443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,16,4,power_law_1.2,0.28372480869293215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,1,64,power_law_1.2,0.035769599676132205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,16,4,power_law_1.01,1.1408767700195312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,1,64,power_law_1.01,0.05620480179786682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,1,64,power_law_1.2,0.033318400382995605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,16,4,power_law_1.2,0.36687359809875486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,1,64,power_law_1.01,0.06111999750137329
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,16,4,power_law_1.01,1.4349568367004395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,1,64,power_law_1.2,0.03454079926013946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,1,64,power_law_1.01,0.08814079761505127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,16,4,power_law_1.2,0.4139840126037598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,16,4,power_law_1.01,2.2238527297973634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,1,64,power_law_1.2,0.03883520066738129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,1,64,power_law_1.01,0.08917120099067688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,16,4,power_law_1.2,0.5624639987945557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,1,64,power_law_1.2,0.03454720079898834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,1,64,power_law_1.01,0.15450880527496338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,16,4,power_law_1.01,4.462739181518555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,16,4,power_law_1.2,0.6757056236267089
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,1,64,power_law_1.2,0.03944959938526153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,1,64,power_law_1.01,0.1841920018196106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,16,4,power_law_1.2,0.9665280342102051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,1,64,power_law_1.2,0.0429504007101059
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,1,64,power_law_1.01,0.262227201461792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,1,64,power_law_1.2,0.05440639853477478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,16,4,power_law_1.2,1.3026047706604005
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,1,64,power_law_1.01,0.3814143896102905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,1,64,power_law_1.01,0.03985919952392578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,1,64,power_law_1.2,0.06771199703216553
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,1,64,power_law_1.01,0.04251520037651062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,1,64,power_law_1.01,0.5497536182403564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,16,4,power_law_1.2,1.4981823921203614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,1,64,power_law_1.2,0.09292160272598267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,1,64,power_law_1.01,0.03924480080604553
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,1,64,power_law_1.01,0.7158720016479492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,16,4,power_law_1.2,2.3571199417114257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,1,64,power_law_1.2,0.11870720386505126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,1,64,power_law_1.01,0.03782399892807007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,1,64,power_law_1.01,1.0078975677490234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,1,64,power_law_1.2,0.16090879440307618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,1,64,power_law_1.01,0.03904640078544617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,16,4,power_law_1.2,5.250118255615234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,1,64,power_law_1.01,1.421388816833496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,1,64,power_law_1.2,0.2239743947982788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,1,64,power_law_1.01,0.03966079950332642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,1,64,power_law_1.01,0.040057599544525146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,1,64,power_law_1.2,0.32289919853210447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,1,64,power_law_1.01,2.6225408554077148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,1,64,power_law_1.01,0.040678399801254275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,1,64,power_law_1.2,0.4136256217956543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,1,64,power_law_1.2,0.0525056004524231
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,1,64,power_law_1.01,0.04128639996051788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,1,64,power_law_1.2,0.6614272117614746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,1,64,power_law_1.2,0.04185599982738495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,1,64,power_law_1.01,0.04170880019664765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,1,64,power_law_1.2,0.04063999950885773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,1,64,power_law_1.2,0.8740032196044922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,2,32,power_law_1.01,0.01913599967956543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,1,64,power_law_1.01,0.04232960045337677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,1,64,power_law_1.2,0.04083200097084046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,1,64,power_law_1.2,1.0839424133300781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,2,32,power_law_1.01,0.01934719979763031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,1,64,power_law_1.01,0.041920000314712526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,1,64,power_law_1.2,0.03960959911346436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,2,32,power_law_1.01,0.01992959976196289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,1,64,power_law_1.2,1.7542335510253906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,1,64,power_law_1.01,0.042931199073791504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,1,64,power_law_1.2,0.041254401206970215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,2,32,power_law_1.01,0.01932159960269928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,1,64,power_law_1.01,0.04415999948978424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,1,64,power_law_1.2,0.04165120124816894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,1,64,power_law_1.2,3.488486480712891
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,2,32,power_law_1.01,0.022598400712013245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,1,64,power_law_1.01,0.04826239943504333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,1,64,power_law_1.2,0.040608000755310056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,2,32,power_law_1.01,0.02426239997148514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,1,64,power_law_1.01,0.04826239943504333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,1,64,power_law_1.2,0.04084480106830597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,2,32,power_law_1.01,0.026713600754737853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,1,64,power_law_1.01,0.05297279953956604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,1,64,power_law_1.2,0.04145280122756958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,2,32,power_law_1.01,0.028352001309394838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,2,32,power_law_1.2,0.019180800020694732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,1,64,power_law_1.01,0.058899199962615965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,1,64,power_law_1.2,0.0430976003408432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,2,32,power_law_1.01,0.030406400561332703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,2,32,power_law_1.2,0.018374399840831758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,1,64,power_law_1.01,0.0652671992778778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,1,64,power_law_1.2,0.04347519874572754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,2,32,power_law_1.01,0.03244799971580505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,2,32,power_law_1.2,0.018367999792099
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,1,64,power_law_1.01,0.07426559925079346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,1,64,power_law_1.2,0.04472320079803467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,2,32,power_law_1.01,0.03511680066585541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,2,32,power_law_1.2,0.018361599743366243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,1,64,power_law_1.01,0.082259202003479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,1,64,power_law_1.2,0.0455487996339798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,2,32,power_law_1.01,0.03490560054779053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,2,32,power_law_1.2,0.021433599293231964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,1,64,power_law_1.01,0.11011840105056762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,1,64,power_law_1.2,0.04922240078449249
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,2,32,power_law_1.01,0.036134400963783266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,2,32,power_law_1.2,0.02348800003528595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,1,64,power_law_1.01,0.11706880331039429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,1,64,power_law_1.2,0.05169919729232788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,2,32,power_law_1.01,0.03715839982032776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,2,32,power_law_1.2,0.024505600333213806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,1,64,power_law_1.01,0.15474560260772705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,1,64,power_law_1.2,0.057011198997497556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,2,32,power_law_1.01,0.036345601081848145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,2,32,power_law_1.2,0.028601598739624024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,1,64,power_law_1.01,0.1932479977607727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,1,64,power_law_1.2,0.06172159910202026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,2,32,power_law_1.01,0.04002560079097748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,2,32,power_law_1.2,0.031488001346588135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,1,64,power_law_1.01,0.2817280054092407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,1,64,power_law_1.2,0.06888960003852844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,2,32,power_law_1.01,0.04103679955005646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,2,32,power_law_1.2,0.03331199884414673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,1,64,power_law_1.01,0.3374527931213379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,1,64,power_law_1.2,0.08056319952011108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,2,32,power_law_1.01,0.04963839948177338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,2,32,power_law_1.2,0.03454079926013946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,1,64,power_law_1.2,0.09100160002708435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,1,64,power_law_1.01,0.4230527877807617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,2,32,power_law_1.01,0.056415998935699464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,2,32,power_law_1.2,0.032287999987602234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,1,64,power_law_1.2,0.1192639946937561
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,1,64,power_law_1.01,0.6876416206359863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,2,32,power_law_1.01,0.07586560249328614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,2,32,power_law_1.2,0.03761920034885406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,1,64,power_law_1.2,0.14487680196762084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,2,32,power_law_1.01,0.09430400133132935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,2,32,power_law_1.2,0.037215998768806456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,1,64,power_law_1.01,1.5985919952392578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,1,64,power_law_1.2,0.20755200386047362
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,2,32,power_law_1.01,0.1307584047317505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,2,32,power_law_1.2,0.03739520013332367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,1,64,power_law_1.2,0.2890431880950928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,2,32,power_law_1.01,0.1651584029197693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,2,32,power_law_1.2,0.040064001083374025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,1,64,power_law_1.2,0.35192320346832273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,2,32,power_law_1.01,0.04928640127182007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,2,32,power_law_1.2,0.04046719968318939
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,2,32,power_law_1.01,0.22104959487915038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,1,64,power_law_1.2,0.576800012588501
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,2,32,power_law_1.01,0.04395520091056824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,2,32,power_law_1.2,0.047443199157714847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,2,32,power_law_1.01,0.2937664031982422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,1,64,power_law_1.2,0.6046463966369628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,2,32,power_law_1.01,0.03782399892807007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,2,32,power_law_1.2,0.06485120058059693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,2,32,power_law_1.01,0.445740795135498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,2,32,power_law_1.01,0.038022398948669434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,2,32,power_law_1.2,0.0828607976436615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,1,64,power_law_1.2,1.2096256256103515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,2,32,power_law_1.01,0.6380288124084472
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,2,32,power_law_1.01,0.04007039964199066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,2,32,power_law_1.2,0.10314240455627441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,2,32,power_law_1.01,0.7768767833709717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,1,64,power_law_1.2,2.4996543884277345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,2,32,power_law_1.01,0.04089600145816803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,2,32,power_law_1.2,0.14001280069351196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,2,32,power_law_1.01,1.2675840377807617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,2,32,power_law_1.01,0.04128639996051788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,2,32,power_law_1.2,0.18262399435043336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,2,32,power_law_1.01,0.040889599919319154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,2,32,power_law_1.2,0.2989248037338257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,2,32,power_law_1.01,2.4222272872924804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,2,32,power_law_1.2,0.0471807986497879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,2,32,power_law_1.01,0.04084480106830597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,2,32,power_law_1.2,0.3669312000274658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,2,32,power_law_1.2,0.040012800693511964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,2,32,power_law_1.01,0.04211840033531189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,2,32,power_law_1.2,0.5567808151245117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,2,32,power_law_1.2,0.03858560025691986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,2,32,power_law_1.01,0.043136000633239746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,2,32,power_law_1.2,0.6565120220184326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,2,32,power_law_1.2,0.039001598954200745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,2,32,power_law_1.01,0.043347200751304625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,4,16,power_law_1.01,0.01995519995689392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,2,32,power_law_1.2,0.040627199411392215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,2,32,power_law_1.2,0.8510848045349121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,2,32,power_law_1.01,0.043750399351119997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,4,16,power_law_1.01,0.019750399887561797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,2,32,power_law_1.2,0.040217599272727965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,2,32,power_law_1.01,0.04580479860305786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,4,16,power_law_1.01,0.019340799748897554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,2,32,power_law_1.2,1.4752896308898926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,2,32,power_law_1.2,0.040633600950241086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,2,32,power_law_1.01,0.049491199851036075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,4,16,power_law_1.01,0.019750399887561797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,2,32,power_law_1.2,0.04145280122756958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,2,32,power_law_1.2,3.001683235168457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,2,32,power_law_1.01,0.050310397148132326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,4,16,power_law_1.01,0.020160000026226043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,2,32,power_law_1.2,0.042483198642730716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,2,32,power_law_1.01,0.05317760109901428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,4,16,power_law_1.01,0.021593600511550903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,2,32,power_law_1.2,0.04226559996604919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,2,32,power_law_1.01,0.05869439840316772
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,4,16,power_law_1.01,0.024223999679088594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,2,32,power_law_1.2,0.0430976003408432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,2,32,power_law_1.01,0.06465280055999756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,4,16,power_law_1.01,0.025670400261878966
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,4,16,power_law_1.2,0.01897599995136261
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,2,32,power_law_1.2,0.04451839923858643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,2,32,power_law_1.01,0.07918720245361328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,4,16,power_law_1.01,0.028358399868011475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,4,16,power_law_1.2,0.01834239959716797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,2,32,power_law_1.2,0.046367999911308286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,4,16,power_law_1.01,0.031020799279212953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,2,32,power_law_1.01,0.08430079817771911
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,4,16,power_law_1.2,0.018361599743366243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,4,16,power_law_1.01,0.036550399661064145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,2,32,power_law_1.2,0.04595839977264404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,2,32,power_law_1.01,0.11338880062103271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,4,16,power_law_1.2,0.018771199882030486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,4,16,power_law_1.01,0.031014400720596313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,2,32,power_law_1.2,0.050470399856567386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,2,32,power_law_1.01,0.12424319982528687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,4,16,power_law_1.2,0.020422400534152986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,4,16,power_law_1.01,0.03449600040912628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,2,32,power_law_1.2,0.050470399856567386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,2,32,power_law_1.01,0.15884799957275392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,4,16,power_law_1.2,0.0212351992726326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,4,16,power_law_1.01,0.03818239867687225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,2,32,power_law_1.2,0.05557760000228882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,2,32,power_law_1.01,0.20717439651489258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,4,16,power_law_1.2,0.022873599827289582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,4,16,power_law_1.01,0.03490560054779053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,2,32,power_law_1.2,0.06151679754257202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,2,32,power_law_1.01,0.2874687910079956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,4,16,power_law_1.2,0.02513279914855957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,4,16,power_law_1.01,0.039417600631713866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,2,32,power_law_1.2,0.06971520185470581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,4,16,power_law_1.2,0.028204798698425293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,2,32,power_law_1.01,0.3407232046127319
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,4,16,power_law_1.01,0.0433023989200592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,2,32,power_law_1.2,0.07850880026817322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,4,16,power_law_1.2,0.031065601110458373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,2,32,power_law_1.01,0.41773438453674316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,4,16,power_law_1.01,0.049395200610160825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,2,32,power_law_1.2,0.09756799936294555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,4,16,power_law_1.2,0.03597440123558045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,2,32,power_law_1.01,0.6466879844665527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,4,16,power_law_1.01,0.05496320128440857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,2,32,power_law_1.2,0.12092159986495972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,4,16,power_law_1.2,0.03147520124912262
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,4,16,power_law_1.01,0.07382400035858154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,2,32,power_law_1.2,0.14590079784393312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,4,16,power_law_1.2,0.033107200264930726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,2,32,power_law_1.01,1.5281344413757325
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,4,16,power_law_1.01,0.09143679738044738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,4,16,power_law_1.2,0.03699199855327606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,2,32,power_law_1.2,0.20160000324249266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,4,16,power_law_1.01,0.1121216058731079
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,4,16,power_law_1.2,0.03720960021018982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,2,32,power_law_1.2,0.2382591962814331
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,4,16,power_law_1.01,0.05563520193099976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,4,16,power_law_1.01,0.1485759973526001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,2,32,power_law_1.2,0.3910399913787842
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,4,16,power_law_1.01,0.039654400944709775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,4,16,power_law_1.01,0.20181119441986084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,2,32,power_law_1.2,0.4596543788909912
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,4,16,power_law_1.01,0.038841599225997926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,4,16,power_law_1.01,0.289465594291687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,2,32,power_law_1.2,0.6531904220581055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,4,16,power_law_1.01,0.0412992000579834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,4,16,power_law_1.01,0.40887041091918946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,2,32,power_law_1.2,1.072812843322754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,4,16,power_law_1.01,0.042335999011993405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,4,16,power_law_1.01,0.5415679931640625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,4,16,power_law_1.01,0.04498560130596161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,2,32,power_law_1.2,2.512358474731445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,4,16,power_law_1.01,0.6333375930786133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,4,16,power_law_1.01,0.046214398741722104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,4,16,power_law_1.01,0.04498560130596161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,4,16,power_law_1.01,1.1084608078002929
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,4,16,power_law_1.01,0.04496000111103058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,4,16,power_law_1.2,0.050457602739334105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,4,16,power_law_1.01,2.272307205200195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,4,16,power_law_1.01,0.04519680142402649
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,4,16,power_law_1.2,0.03980799913406372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,4,16,power_law_1.01,0.04661119878292084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,4,16,power_law_1.2,0.03898879885673523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,4,16,power_law_1.01,0.047443199157714847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,2,32,power_law_1.01,0.02139520049095154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,4,16,power_law_1.2,0.04043520092964172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,4,16,power_law_1.01,0.047225600481033324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,2,32,power_law_1.01,0.020979200303554536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,4,16,power_law_1.2,0.04204800128936768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,4,16,power_law_1.01,0.049702399969100954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,2,32,power_law_1.01,0.020972800254821778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,4,16,power_law_1.2,0.045952001214027406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,4,16,power_law_1.01,0.053600001335144046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,2,32,power_law_1.01,0.021376000344753267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,4,16,power_law_1.2,0.046374401450157164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,4,16,power_law_1.01,0.05603839755058289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,2,32,power_law_1.01,0.02157440036535263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,4,16,power_law_1.2,0.045542401075363156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,4,16,power_law_1.01,0.058931201696395874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,2,32,power_law_1.01,0.024038399755954742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,4,16,power_law_1.2,0.04596480131149292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,4,16,power_law_1.01,0.06464639902114869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,2,32,power_law_1.01,0.02733440101146698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,4,16,power_law_1.2,0.04514560103416443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,4,16,power_law_1.01,0.07140480279922486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,4,16,power_law_1.2,0.046777600049972536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,2,32,power_law_1.01,0.032025599479675294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,4,16,power_law_1.01,0.08553599715232849
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,4,16,power_law_1.2,0.04780159890651703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,2,32,power_law_1.01,0.033888000249862674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,4,16,power_law_1.2,0.04799999892711639
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,2,32,power_law_1.01,0.03573119938373566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,4,16,power_law_1.2,0.05006080269813538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,2,32,power_law_1.01,0.04166400134563446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,4,16,power_law_1.2,0.05415679812431336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,2,32,power_law_1.01,0.04679040014743805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,4,16,power_law_1.2,0.05863680243492127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,2,32,power_law_1.01,0.037574398517608645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,4,16,power_law_1.2,0.06110720038414001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,2,32,power_law_1.01,0.04391680061817169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,4,16,power_law_1.2,0.06766719818115234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,2,32,power_law_1.01,0.048825600743293764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,4,16,power_law_1.2,0.07463039755821228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,2,32,power_law_1.01,0.040031999349594116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,4,16,power_law_1.2,0.09427840113639832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,2,32,power_law_1.01,0.04883840084075928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,4,16,power_law_1.2,0.10084480047225952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,2,32,power_law_1.01,0.0574400007724762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,4,16,power_law_1.2,0.13033599853515626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,2,32,power_law_1.01,0.07341439723968506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,4,16,power_law_1.2,0.1508095979690552
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,2,32,power_law_1.01,0.09594240188598632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,4,16,power_law_1.2,0.2016063928604126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,2,32,power_law_1.01,0.11601279973983765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,4,16,power_law_1.2,0.23969919681549073
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,2,32,power_law_1.01,0.1590208053588867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,4,16,power_law_1.2,0.3318592071533203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,2,32,power_law_1.01,0.20446720123291015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,2,32,power_law_1.01,0.2947968006134033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,4,16,power_law_1.2,0.5784383773803711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,2,32,power_law_1.01,0.3838720083236694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,4,16,power_law_1.2,0.7183167934417725
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,2,32,power_law_1.01,0.5649216175079346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,4,16,power_law_1.2,1.1187071800231934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,2,32,power_law_1.01,0.7469696044921875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,4,16,power_law_1.2,2.543903923034668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,2,32,power_law_1.01,0.9227583885192872
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,2,32,power_law_1.01,1.4635647773742675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,2,32,power_law_1.01,2.9061887741088865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,2,32,power_law_1.2,0.02341119945049286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,2,32,power_law_1.2,0.022201600670814513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,2,32,power_law_1.2,0.023014399409294128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,2,32,power_law_1.2,0.02280319929122925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,2,32,power_law_1.01,0.08979840278625488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,2,32,power_law_1.2,0.025062400102615356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,2,32,power_law_1.01,0.0650111973285675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,2,32,power_law_1.2,0.030393600463867188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,2,32,power_law_1.01,0.05661439895629883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,2,32,power_law_1.2,0.03407999873161316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,2,32,power_law_1.01,0.058259201049804685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,2,32,power_law_1.2,0.038176000118255615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,2,32,power_law_1.01,0.05989760160446167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,2,32,power_law_1.2,0.04287999868392944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,2,32,power_law_1.01,0.06357759833335877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,2,32,power_law_1.2,0.045747199654579164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,2,32,power_law_1.01,0.06399359703063964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,2,32,power_law_1.2,0.053324800729751584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,2,32,power_law_1.01,0.06520320177078247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,2,32,power_law_1.2,0.06377599835395813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,2,32,power_law_1.01,0.06480640172958374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,2,32,power_law_1.2,0.051283198595047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,2,32,power_law_1.01,0.06624000072479248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,2,32,power_law_1.2,0.057011198997497556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,2,32,power_law_1.01,0.06747519969940186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,2,32,power_law_1.01,0.06931840181350708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,2,32,power_law_1.2,0.06663680076599121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,2,32,power_law_1.01,0.07013760209083557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,2,32,power_law_1.2,0.05251200199127197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,2,32,power_law_1.01,0.07115520238876342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,2,32,power_law_1.2,0.06725119948387145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,2,32,power_law_1.01,0.0791487991809845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,2,32,power_law_1.2,0.08569599986076355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,2,32,power_law_1.01,0.08243200182914734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,2,32,power_law_1.2,0.10862720012664795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,2,32,power_law_1.01,0.09429759979248047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,2,32,power_law_1.2,0.13525760173797607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,2,32,power_law_1.01,0.10351359844207764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,2,32,power_law_1.2,0.19668480157852172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,2,32,power_law_1.01,0.11253119707107544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,2,32,power_law_1.2,0.2753407955169678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,2,32,power_law_1.01,0.1307584047317505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,2,32,power_law_1.2,0.36066560745239257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,2,32,power_law_1.01,0.14262399673461915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,2,32,power_law_1.2,0.5464831829071045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,2,32,power_law_1.01,0.1856384038925171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,2,32,power_law_1.2,0.7437119960784913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,2,32,power_law_1.01,0.20858240127563477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,2,32,power_law_1.2,1.0699520111083984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,2,32,power_law_1.01,0.289683198928833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,2,32,power_law_1.2,1.3968064308166503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,2,32,power_law_1.01,0.3562432050704956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,2,32,power_law_1.2,1.7337152481079101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,2,32,power_law_1.01,0.4838143825531006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,2,32,power_law_1.2,3.4077503204345705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,2,32,power_law_1.01,0.6454207897186279
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,2,32,power_law_1.01,0.7179200172424316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,2,32,power_law_1.2,6.8668159484863285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,2,32,power_law_1.01,1.1288384437561034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,2,32,power_law_1.01,2.5090688705444335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,2,32,power_law_1.2,0.09018880128860474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,2,32,power_law_1.2,0.05742080211639404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,2,32,power_law_1.2,0.059059202671051025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,2,32,power_law_1.2,0.05803520083427429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,4,16,power_law_1.01,0.02078080028295517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,2,32,power_law_1.2,0.0586624026298523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,4,16,power_law_1.01,0.021792000532150267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,2,32,power_law_1.2,0.06233599781990051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,4,16,power_law_1.01,0.021388800442218782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,2,32,power_law_1.2,0.06214399933815003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,4,16,power_law_1.01,0.022009600698947907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,2,32,power_law_1.2,0.06499840021133423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,4,16,power_law_1.01,0.02568959891796112
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,2,32,power_law_1.2,0.06603519916534424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,4,16,power_law_1.01,0.02630400061607361
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,4,16,power_law_1.01,0.030406400561332703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,2,32,power_law_1.2,0.06684799790382386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,4,16,power_law_1.01,0.03736959993839264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,2,32,power_law_1.2,0.0686784029006958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,4,16,power_law_1.01,0.03982079923152924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,2,32,power_law_1.2,0.06888319849967957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,4,16,power_law_1.01,0.04433279931545257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,2,32,power_law_1.2,0.07095040082931518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,4,16,power_law_1.01,0.04821760058403015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,2,32,power_law_1.2,0.07544320225715637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,4,16,power_law_1.01,0.05375360250473023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,2,32,power_law_1.2,0.08117759823799134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,4,16,power_law_1.01,0.04576640129089356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,2,32,power_law_1.2,0.08363519906997681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,4,16,power_law_1.01,0.05170559883117676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,2,32,power_law_1.2,0.09224960207939148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,4,16,power_law_1.01,0.057030397653579715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,2,32,power_law_1.2,0.10329600572586059
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,4,16,power_law_1.01,0.050886398553848265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,2,32,power_law_1.2,0.11989120244979859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,4,16,power_law_1.01,0.05538560152053833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,2,32,power_law_1.2,0.13525760173797607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,4,16,power_law_1.01,0.06357759833335877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,2,32,power_law_1.2,0.14978560209274291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,4,16,power_law_1.01,0.0807807981967926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,2,32,power_law_1.2,0.1962815999984741
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,4,16,power_law_1.01,0.10679039955139161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,2,32,power_law_1.2,0.23335039615631104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,4,16,power_law_1.01,0.13014400005340576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,2,32,power_law_1.2,0.32858240604400635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,4,16,power_law_1.01,0.1788607954978943
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,2,32,power_law_1.2,0.4252480030059814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,4,16,power_law_1.01,0.2280128002166748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,2,32,power_law_1.2,0.5571392059326172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,4,16,power_law_1.01,0.33187839984893797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,2,32,power_law_1.2,0.6711935997009277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,4,16,power_law_1.01,0.43547520637512205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,2,32,power_law_1.2,1.060095977783203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,4,16,power_law_1.01,0.6404863834381104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,2,32,power_law_1.2,1.7525503158569335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,4,16,power_law_1.01,0.844268798828125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,4,16,power_law_1.01,1.051257610321045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,2,32,power_law_1.2,3.611110305786133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,4,16,power_law_1.01,1.6649087905883788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,4,16,power_law_1.2,0.03842560052871704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,4,16,power_law_1.2,0.04314880073070526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,4,16,power_law_1.01,3.295084762573242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,4,16,power_law_1.2,0.04969600141048432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,4,16,power_law_1.2,0.05749120116233826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,4,16,power_law_1.2,0.026086398959159852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,4,16,power_law_1.2,0.07489280104637146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,4,16,power_law_1.2,0.022809599339962006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,4,16,power_law_1.01,0.07992320060729981
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,4,16,power_law_1.2,0.08942720293998718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,4,16,power_law_1.2,0.023628799617290495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,4,16,power_law_1.01,0.06931840181350708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,4,16,power_law_1.2,0.12732800245285034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,4,16,power_law_1.2,0.024639999866485594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,4,16,power_law_1.01,0.05969280004501343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,4,16,power_law_1.2,0.16500480175018312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,4,16,power_law_1.2,0.028960001468658448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,4,16,power_law_1.01,0.06050559878349304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,4,16,power_law_1.2,0.23851521015167237
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,4,16,power_law_1.2,0.033055999875068666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,4,16,power_law_1.01,0.061945599317550656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,4,16,power_law_1.2,0.30201599597930906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,4,16,power_law_1.2,0.03776639997959137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,4,16,power_law_1.01,0.06869760155677795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,4,16,power_law_1.2,0.47322878837585447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,4,16,power_law_1.2,0.04104959964752197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,4,16,power_law_1.01,0.06991360187530518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,4,16,power_law_1.2,0.6075776100158692
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,4,16,power_law_1.2,0.046163201332092285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,4,16,power_law_1.01,0.06848000288009644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,4,16,power_law_1.2,0.740070390701294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,4,16,power_law_1.2,0.05169919729232788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,4,16,power_law_1.01,0.07075200080871583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,4,16,power_law_1.2,1.261683177947998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,4,16,power_law_1.01,0.07300480008125305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,4,16,power_law_1.2,0.053932797908782956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,4,16,power_law_1.01,0.07339519858360291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,4,16,power_law_1.2,0.06356480121612548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,4,16,power_law_1.2,2.407148742675781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,4,16,power_law_1.01,0.07423359751701356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,4,16,power_law_1.2,0.054553598165512085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,4,16,power_law_1.01,0.07893760204315185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,4,16,power_law_1.2,0.05824000239372253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,4,16,power_law_1.01,0.07910400032997131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,4,16,power_law_1.2,0.06643199920654297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,4,16,power_law_1.2,0.07939199805259704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,4,16,power_law_1.01,0.08569599986076355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,4,16,power_law_1.2,0.063155198097229
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,4,16,power_law_1.2,0.05748479962348938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,4,16,power_law_1.01,0.09086080193519593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,4,16,power_law_1.01,0.09102079868316651
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,4,16,power_law_1.2,0.06520320177078247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,4,16,power_law_1.2,0.05911679863929749
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,4,16,power_law_1.01,0.11604479551315308
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,4,16,power_law_1.01,0.0965503990650177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,4,16,power_law_1.2,0.07955200076103211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,4,16,power_law_1.2,0.05931519865989685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,4,16,power_law_1.01,0.14371199607849122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,4,16,power_law_1.01,0.11354240179061889
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,4,16,power_law_1.2,0.09735680222511292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,4,16,power_law_1.2,0.05848960280418396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,4,16,power_law_1.01,0.1711359977722168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,4,16,power_law_1.01,0.12296960353851319
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,4,16,power_law_1.2,0.12378879785537719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,4,16,power_law_1.2,0.06588159799575806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,4,16,power_law_1.01,0.22644479274749757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,4,16,power_law_1.01,0.14837119579315186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,4,16,power_law_1.2,0.16064640283584594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,4,16,power_law_1.2,0.06791679859161377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,4,16,power_law_1.01,0.16147199869155884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,4,16,power_law_1.01,0.33703041076660156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,4,16,power_law_1.2,0.22904319763183595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,4,16,power_law_1.2,0.06915199756622314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,4,16,power_law_1.01,0.1889024019241333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,4,16,power_law_1.01,0.42345600128173827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,4,16,power_law_1.2,0.2908992052078247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,4,16,power_law_1.2,0.06955519914627076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,4,16,power_law_1.01,0.22760961055755616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,4,16,power_law_1.2,0.40782718658447265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,4,16,power_law_1.01,0.48510079383850097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,4,16,power_law_1.2,0.07223039865493774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,4,16,power_law_1.01,0.292742395401001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,4,16,power_law_1.2,0.07344639897346497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,4,16,power_law_1.2,0.5481215953826905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,4,16,power_law_1.01,0.8277312278747558
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,4,16,power_law_1.01,0.37363200187683104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,4,16,power_law_1.2,0.07367039918899536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,4,16,power_law_1.2,0.8538880348205566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,4,16,power_law_1.01,1.561740779876709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,4,16,power_law_1.01,0.5263807773590088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,4,16,power_law_1.2,0.07570559978485107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,4,16,power_law_1.2,1.161248016357422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,4,16,power_law_1.2,0.07713279724121094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,4,16,power_law_1.01,0.6769472122192383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,4,16,power_law_1.2,1.5035136222839356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,4,16,power_law_1.2,0.08636159896850586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,4,16,power_law_1.01,0.8354559898376465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,4,16,power_law_1.2,2.267616081237793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,1,64,power_law_1.01,0.09433599710464477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,4,16,power_law_1.2,0.08818560242652893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,4,16,power_law_1.01,1.293171215057373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,1,64,power_law_1.01,0.1191167950630188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,4,16,power_law_1.2,0.09823359847068787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,4,16,power_law_1.2,4.82597770690918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,4,16,power_law_1.01,2.4877824783325195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,1,64,power_law_1.01,0.09086080193519593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,4,16,power_law_1.2,0.11297919750213622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,4,16,power_law_1.2,0.1301568031311035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,1,64,power_law_1.01,0.06197119951248169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,4,16,power_law_1.2,0.14615679979324342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,1,64,power_law_1.01,0.06915199756622314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,1,64,power_law_1.2,0.13381760120391845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,4,16,power_law_1.2,0.15700479745864868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,2,32,power_law_1.01,0.0820032000541687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,1,64,power_law_1.01,0.0748799979686737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,1,64,power_law_1.2,0.08978559970855712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,4,16,power_law_1.2,0.1994047999382019
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,2,32,power_law_1.01,0.10188159942626954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,1,64,power_law_1.01,0.07366399765014649
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,1,64,power_law_1.2,0.08650239706039428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,4,16,power_law_1.2,0.25102078914642334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,2,32,power_law_1.01,0.09491199851036072
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,1,64,power_law_1.01,0.0834879994392395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,4,16,power_law_1.2,0.3370368003845215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,1,64,power_law_1.2,0.06602240204811097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,2,32,power_law_1.01,0.06602240204811097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,4,16,power_law_1.2,0.4070784091949463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,1,64,power_law_1.01,0.0859391987323761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,1,64,power_law_1.2,0.06848000288009644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,2,32,power_law_1.01,0.06931840181350708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,4,16,power_law_1.2,0.5936511993408203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,1,64,power_law_1.01,0.08594560027122497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,1,64,power_law_1.2,0.07461760044097901
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,2,32,power_law_1.01,0.07504640221595764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,4,16,power_law_1.2,0.7871744155883789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,1,64,power_law_1.01,0.0877888023853302
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,1,64,power_law_1.2,0.07319039702415467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,2,32,power_law_1.01,0.07648640275001525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,4,16,power_law_1.2,0.9940352439880371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,1,64,power_law_1.2,0.08568959832191467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,1,64,power_law_1.01,0.09205759763717651
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,2,32,power_law_1.01,0.08035839796066284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,4,16,power_law_1.2,1.6125312805175782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,1,64,power_law_1.2,0.09101439714431762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,1,64,power_law_1.01,0.09065600037574768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,2,32,power_law_1.01,0.08569599986076355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,1,64,power_law_1.01,0.0949567973613739
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,1,64,power_law_1.2,0.08731520175933838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,2,32,power_law_1.01,0.08918399810791015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,4,16,power_law_1.2,3.511840057373047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,1,64,power_law_1.01,0.10110080242156982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,1,64,power_law_1.2,0.08098559975624084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,2,32,power_law_1.01,0.09511039853096008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,1,64,power_law_1.01,0.09864320158958435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,2,32,power_law_1.01,0.09758080244064331
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,1,64,power_law_1.2,0.091430401802063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,2,32,power_law_1.2,0.08288000226020813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,1,64,power_law_1.01,0.10478719472885131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,2,32,power_law_1.01,0.09205120205879211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,1,64,power_law_1.2,0.08916479945182801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,2,32,power_law_1.2,0.095769602060318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,2,32,power_law_1.01,0.09676160216331482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,1,64,power_law_1.01,0.11667200326919555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,1,64,power_law_1.2,0.09141759872436524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,2,32,power_law_1.2,0.09189119935035706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,2,32,power_law_1.01,0.10536320209503174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,1,64,power_law_1.2,0.09797120094299316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,1,64,power_law_1.01,0.12855039834976195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,2,32,power_law_1.2,0.06403840184211732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,2,32,power_law_1.01,0.10556800365447998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,1,64,power_law_1.2,0.1028864026069641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,1,64,power_law_1.01,0.1486143946647644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,2,32,power_law_1.01,0.11313920021057129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,2,32,power_law_1.2,0.0664896011352539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,1,64,power_law_1.2,0.10903680324554443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,1,64,power_law_1.01,0.17522560358047484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,2,32,power_law_1.01,0.12522879838943482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,1,64,power_law_1.2,0.1213312029838562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,2,32,power_law_1.2,0.07120640277862549
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,1,64,power_law_1.01,0.21537280082702637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,2,32,power_law_1.01,0.13525760173797607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,2,32,power_law_1.2,0.0773311972618103
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,1,64,power_law_1.2,0.13238400220870972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,1,64,power_law_1.01,0.24568960666656495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,2,32,power_law_1.01,0.15820159912109374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,2,32,power_law_1.2,0.0847104012966156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,1,64,power_law_1.2,0.1588096022605896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,1,64,power_law_1.01,0.32106239795684816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,2,32,power_law_1.01,0.18339200019836427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,1,64,power_law_1.2,0.18012160062789917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,2,32,power_law_1.2,0.08492159843444824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,1,64,power_law_1.01,0.4095295906066895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,2,32,power_law_1.01,0.22658560276031495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,2,32,power_law_1.2,0.08923519849777221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,1,64,power_law_1.2,0.2386687994003296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,1,64,power_law_1.01,0.5657855987548828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,2,32,power_law_1.01,0.2622335910797119
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,2,32,power_law_1.2,0.08819839954376221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,1,64,power_law_1.2,0.2683712005615234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,1,64,power_law_1.01,0.7379839897155762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,2,32,power_law_1.01,0.3445503950119019
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,2,32,power_law_1.2,0.09126399755477906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,1,64,power_law_1.2,0.3644223928451538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,1,64,power_law_1.01,0.8776960372924805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,2,32,power_law_1.01,0.423199987411499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,2,32,power_law_1.2,0.09167360067367554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,1,64,power_law_1.2,0.4457280158996582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,1,64,power_law_1.01,1.359590435028076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,2,32,power_law_1.2,0.09371520280838012
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,2,32,power_law_1.01,0.5628672122955323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,1,64,power_law_1.2,0.6169280052185059
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,1,64,power_law_1.01,2.742393684387207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,2,32,power_law_1.2,0.10089600086212158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,2,32,power_law_1.01,0.7387904167175293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,1,64,power_law_1.2,0.8289024353027343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,2,32,power_law_1.2,0.10643839836120605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,2,32,power_law_1.01,0.8547136306762695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,1,64,power_law_1.2,1.0513216018676759
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,2,32,power_law_1.2,0.11360000371932984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,2,32,power_law_1.01,1.444320011138916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,1,64,power_law_1.2,1.7808256149291992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,4,16,power_law_1.01,0.07038080096244811
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,2,32,power_law_1.2,0.12691199779510498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,4,16,power_law_1.01,0.08963840007781983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,2,32,power_law_1.2,0.134278404712677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,2,32,power_law_1.01,2.617209625244141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,1,64,power_law_1.2,3.479020690917969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,4,16,power_law_1.01,0.10929280519485474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,2,32,power_law_1.2,0.16622719764709473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,4,16,power_law_1.01,0.06628479957580566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,2,32,power_law_1.2,0.18097280263900756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,4,16,power_law_1.01,0.07099519968032837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,2,32,power_law_1.2,0.23545598983764648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,4,16,power_law_1.2,0.07340160012245178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,8,8,power_law_1.01,0.07913600206375122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,4,16,power_law_1.01,0.07816320061683654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,4,16,power_law_1.2,0.08896639943122864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,2,32,power_law_1.2,0.26617600917816164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,8,8,power_law_1.01,0.08610560297966004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,4,16,power_law_1.2,0.08138880133628845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,4,16,power_law_1.01,0.08019199967384338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,2,32,power_law_1.2,0.35997440814971926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,8,8,power_law_1.01,0.10577919483184814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,4,16,power_law_1.2,0.06684160232543945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,4,16,power_law_1.01,0.09126399755477906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,2,32,power_law_1.2,0.4478208065032959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,8,8,power_law_1.01,0.07257599830627441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,4,16,power_law_1.2,0.07237120270729065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,4,16,power_law_1.01,0.09434239864349366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,2,32,power_law_1.2,0.6296832084655761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,8,8,power_law_1.01,0.07544320225715637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,4,16,power_law_1.2,0.07649919986724854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,4,16,power_law_1.01,0.09353600144386291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,8,8,power_law_1.01,0.08855680227279664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,2,32,power_law_1.2,0.7785727977752686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,4,16,power_law_1.2,0.08098559975624084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,4,16,power_law_1.01,0.09516159892082214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,8,8,power_law_1.01,0.09221760034561158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,2,32,power_law_1.2,1.0436032295227051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,4,16,power_law_1.2,0.08570240139961242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,4,16,power_law_1.01,0.10049279928207397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,8,8,power_law_1.01,0.1041152000427246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,2,32,power_law_1.2,1.634239959716797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,4,16,power_law_1.2,0.09223039746284485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,4,16,power_law_1.01,0.10089600086212158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,8,8,power_law_1.01,0.10842239856719971
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,4,16,power_law_1.2,0.09143679738044738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,2,32,power_law_1.2,3.88682861328125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,4,16,power_law_1.01,0.10602240562438965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,8,8,power_law_1.01,0.10842239856719971
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,4,16,power_law_1.2,0.1020799994468689
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,4,16,power_law_1.01,0.11379200220108032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,8,8,power_law_1.01,0.11804800033569336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,4,16,power_law_1.2,0.10371840000152588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,4,16,power_law_1.01,0.11645439863204957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,8,8,power_law_1.01,0.1174015998840332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,4,16,power_law_1.2,0.10045440196990967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,8,8,power_law_1.2,0.07918720245361328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,4,16,power_law_1.01,0.12156800031661988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,8,8,power_law_1.01,0.12665599584579468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,4,16,power_law_1.2,0.10229120254516602
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,8,8,power_law_1.2,0.08266879916191101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,4,16,power_law_1.01,0.13489279747009278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,8,8,power_law_1.01,0.12398719787597656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,4,16,power_law_1.2,0.112716805934906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,8,8,power_law_1.2,0.07838079929351807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,8,8,power_law_1.01,0.13749760389328003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,4,16,power_law_1.01,0.15045759677886963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,4,16,power_law_1.2,0.11784960031509399
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,8,8,power_law_1.2,0.06628479957580566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,8,8,power_law_1.01,0.13566720485687256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,4,16,power_law_1.01,0.179750394821167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,4,16,power_law_1.2,0.12541439533233642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,8,8,power_law_1.2,0.07488639950752259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,8,8,power_law_1.01,0.14425599575042725
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,4,16,power_law_1.01,0.19304959774017333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,4,16,power_law_1.2,0.14364800453186036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,8,8,power_law_1.2,0.08309119939804077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,8,8,power_law_1.01,0.16227840185165404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,4,16,power_law_1.01,0.24241280555725098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,4,16,power_law_1.2,0.15082240104675293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,8,8,power_law_1.2,0.0886080026626587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,8,8,power_law_1.01,0.18029439449310303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,4,16,power_law_1.01,0.28460159301757815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,4,16,power_law_1.2,0.18093440532684327
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,8,8,power_law_1.2,0.09802240133285522
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,8,8,power_law_1.01,0.21395199298858641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,4,16,power_law_1.01,0.3644799947738647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,4,16,power_law_1.2,0.20405759811401367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,8,8,power_law_1.2,0.11052160263061524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,8,8,power_law_1.01,0.23968639373779296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,4,16,power_law_1.01,0.45273599624633787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,4,16,power_law_1.2,0.24993278980255126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,8,8,power_law_1.2,0.10806399583816528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,8,8,power_law_1.01,0.28967039585113524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,4,16,power_law_1.01,0.6218751907348633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,4,16,power_law_1.2,0.2966464042663574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,8,8,power_law_1.2,0.11461759805679321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,8,8,power_law_1.01,0.33717119693756104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,4,16,power_law_1.01,0.8092927932739258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,4,16,power_law_1.2,0.406828784942627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,8,8,power_law_1.2,0.11299200057983398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,8,8,power_law_1.01,0.45187840461730955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,4,16,power_law_1.01,1.047264003753662
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,4,16,power_law_1.2,0.504691219329834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,8,8,power_law_1.2,0.12076159715652465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,8,8,power_law_1.01,0.5305215835571289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,4,16,power_law_1.01,1.441919994354248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,4,16,power_law_1.2,0.6593408107757568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,8,8,power_law_1.2,0.1238592028617859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,8,8,power_law_1.01,0.7400320053100586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,4,16,power_law_1.01,2.9041919708251953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,8,8,power_law_1.2,0.13284480571746826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,4,16,power_law_1.2,0.9026368141174317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,8,8,power_law_1.01,1.0029824256896973
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,8,8,power_law_1.2,0.13366400003433226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,4,16,power_law_1.2,1.1133695602416993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,8,8,power_law_1.01,1.1682496070861816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,8,8,power_law_1.2,0.15067520141601562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,4,16,power_law_1.2,1.6395200729370116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,8,8,power_law_1.01,1.7439615249633789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,8,8,power_law_1.2,0.16951040029525757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,16,4,power_law_1.01,0.08532480001449586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,8,8,power_law_1.2,0.1883455991744995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,4,16,power_law_1.2,3.166489601135254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,8,8,power_law_1.01,3.4745151519775392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,16,4,power_law_1.01,0.08757759928703308
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,8,8,power_law_1.2,0.21763839721679687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,16,4,power_law_1.01,0.10558079481124878
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,8,8,power_law_1.2,0.23790080547332765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,8,8,power_law_1.2,0.307532811164856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,16,4,power_law_1.01,0.07898240089416504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,16,4,power_law_1.01,0.0937279999256134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,16,4,power_law_1.2,0.08734080195426941
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,16,4,power_law_1.01,0.11276160478591919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,16,4,power_law_1.2,0.08734080195426941
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,16,4,power_law_1.01,0.12318079471588135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,16,4,power_law_1.2,0.08221439719200134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,16,4,power_law_1.2,0.08076159954071045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,16,4,power_law_1.01,0.13794560432434083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,16,4,power_law_1.2,0.09225599765777588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,16,4,power_law_1.01,0.1486207962036133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,16,4,power_law_1.2,0.1110975980758667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,16,4,power_law_1.01,0.14922879934310912
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,8,power_law_1.01,0.032441601157188416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,8,power_law_1.01,0.031219199299812317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,16,4,power_law_1.2,0.11560319662094116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,16,4,power_law_1.01,0.15443840026855468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,8,power_law_1.01,0.031411200761795044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,16,4,power_law_1.2,0.1356735944747925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,16,4,power_law_1.01,0.1627519965171814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,8,power_law_1.01,0.03163520097732544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,8,power_law_1.01,0.03284479975700379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,16,4,power_law_1.2,0.1381119966506958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,16,4,power_law_1.01,0.1676543951034546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,8,power_law_1.01,0.04267520010471344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,16,4,power_law_1.2,0.14960000514984131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,16,4,power_law_1.01,0.1699072003364563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,8,power_law_1.01,0.04493440091609955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,8,power_law_1.01,0.03346560001373291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,16,4,power_law_1.2,0.1606592059135437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,16,4,power_law_1.01,0.19613440036773683
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,8,power_law_1.01,0.03407999873161316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,16,4,power_law_1.2,0.16167680025100709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,16,4,power_law_1.01,0.19365760087966918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,8,power_law_1.01,0.03407360017299652
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,8,power_law_1.01,0.03653759956359863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,16,4,power_law_1.2,0.1688447952270508
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,16,4,power_law_1.01,0.2090303897857666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,8,power_law_1.01,0.03818239867687225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,16,4,power_law_1.2,0.1725376009941101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,16,4,power_law_1.01,0.2329792022705078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,8,power_law_1.01,0.03818239867687225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,16,4,power_law_1.2,0.18050559759140014
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,16,4,power_law_1.01,0.2556544065475464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,16,4,power_law_1.2,0.18810240030288697
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,16,4,power_law_1.01,0.2987328052520752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,16,4,power_law_1.2,0.20324480533599854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,16,4,power_law_1.01,0.32413439750671386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,16,4,power_law_1.2,0.23082880973815917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,16,4,power_law_1.01,0.40297598838806153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,16,4,power_law_1.2,0.26080639362335206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,16,4,power_law_1.01,0.4588160037994385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,16,4,power_law_1.2,0.3054464101791382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,16,4,power_law_1.01,0.6108543872833252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,16,4,power_law_1.2,0.33924479484558107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,16,4,power_law_1.01,0.751955223083496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,16,4,power_law_1.2,0.4223936080932617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,16,4,power_law_1.01,1.0548480033874512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,16,4,power_law_1.2,0.47031679153442385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,16,4,power_law_1.01,1.3362431526184082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,16,4,power_law_1.2,0.6177728176116943
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,16,4,power_law_1.01,1.5744383811950684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,16,4,power_law_1.2,0.8055680274963379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,16,4,power_law_1.01,2.3878847122192384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,16,4,power_law_1.2,1.1034815788269043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,16,4,power_law_1.2,1.4196928024291993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,16,4,power_law_1.01,4.800576019287109
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,16,4,power_law_1.2,1.608723258972168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,16,4,power_law_1.2,2.482809638977051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,16,4,power_law_1.2,5.140371322631836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,8,power_law_1.2,0.030239999294281006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,8,power_law_1.2,0.030649599432945252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,8,power_law_1.2,0.031046399474143983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,8,power_law_1.2,0.03139840066432953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,8,power_law_1.2,0.03160319924354553
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,8,power_law_1.2,0.04007039964199066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,8,power_law_1.2,0.046623998880386354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,4,power_law_1.01,0.03368319869041443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,8,power_law_1.2,0.03597440123558045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,4,power_law_1.01,0.03163520097732544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,8,power_law_1.2,0.03555839955806732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,4,power_law_1.01,0.03080959916114807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,8,power_law_1.2,0.03720960021018982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,4,power_law_1.01,0.03162879943847656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,8,power_law_1.2,0.034745600819587705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,4,power_law_1.01,0.03245440125465393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,8,power_law_1.2,0.036800000071525577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,4,power_law_1.01,0.04023680090904236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,8,power_law_1.2,0.03763200044631958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,4,power_law_1.01,0.044947201013565065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,8,power_law_1.2,0.03903999924659729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,4,power_law_1.01,0.03326080143451691
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,8,power_law_1.2,0.04805760085582733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,4,power_law_1.01,0.033478400111198424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,8,power_law_1.2,0.05072000026702881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,4,power_law_1.01,0.034092798829078674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,8,power_law_1.2,0.054816001653671266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,4,power_law_1.01,0.03531520068645477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,8,power_law_1.2,0.06444159746170045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,4,power_law_1.01,0.03532159924507141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,8,power_law_1.2,0.0677183985710144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,4,power_law_1.01,0.03675520122051239
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,8,power_law_1.2,0.08799359798431397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,4,power_law_1.01,0.03818239867687225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,8,power_law_1.2,0.08963840007781983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,4,power_law_1.01,0.04350079894065857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,8,power_law_1.2,0.1240447998046875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,4,power_law_1.01,0.04555520117282867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,4,power_law_1.01,0.05006080269813538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,8,power_law_1.2,0.13713279962539673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,4,power_law_1.01,0.06071680188179016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,8,power_law_1.2,0.18833919763565063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,4,power_law_1.01,0.07218559980392455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,8,power_law_1.2,0.23279359340667724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,4,power_law_1.01,0.09716479778289795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,8,power_law_1.2,0.3353919982910156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,4,power_law_1.01,0.08610560297966004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,8,power_law_1.2,0.43306879997253417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,4,power_law_1.01,0.1074112057685852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,8,power_law_1.2,0.5522496223449707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,4,power_law_1.01,0.13566720485687256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,8,power_law_1.2,0.8625408172607422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,4,power_law_1.01,0.1626431941986084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,8,power_law_1.2,1.7690111160278321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,4,power_law_1.01,0.22352640628814696
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,4,power_law_1.01,0.3496896028518677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,4,power_law_1.01,0.40088958740234376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,4,power_law_1.01,0.5522304058074952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,4,power_law_1.01,1.038144016265869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,4,power_law_1.01,1.5808704376220704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,4,power_law_1.2,0.03187200129032135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,4,power_law_1.2,0.03025279939174652
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,4,power_law_1.2,0.030239999294281006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,4,power_law_1.2,0.030239999294281006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,4,power_law_1.2,0.030239999294281006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,4,power_law_1.2,0.04048640131950378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,4,power_law_1.2,0.04204800128936768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,4,power_law_1.2,0.03188480138778686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,4,power_law_1.2,0.03310079872608185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,4,power_law_1.2,0.03386879861354828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,4,power_law_1.2,0.03433600068092346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,8,power_law_1.01,0.03818880021572113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,4,power_law_1.2,0.03452799916267395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,8,power_law_1.01,0.03777920007705689
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,4,power_law_1.2,0.03597440123558045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,8,power_law_1.01,0.03776000142097473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,4,power_law_1.2,0.038841599225997926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,8,power_law_1.01,0.03632639944553375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,4,power_law_1.2,0.04273279905319214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,8,power_law_1.01,0.036550399661064145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,4,power_law_1.2,0.04519680142402649
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,8,power_law_1.01,0.03736959993839264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,4,power_law_1.2,0.04990079998970032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,8,power_law_1.01,0.03797760009765625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,4,power_law_1.2,0.05440639853477478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,8,power_law_1.01,0.03758080005645752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,4,power_law_1.2,0.06342399716377259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,8,power_law_1.01,0.0385919988155365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,4,power_law_1.2,0.09619839787483216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,8,power_law_1.01,0.040031999349594116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,4,power_law_1.2,0.09496319890022278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,8,power_law_1.01,0.04227840006351471
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,4,power_law_1.2,0.12711039781570435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,8,power_law_1.01,0.04330880045890808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,4,power_law_1.2,0.14369920492172242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,8,power_law_1.01,0.044537600874900815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,8,power_law_1.01,0.04842880070209503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,4,power_law_1.2,0.24753279685974122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,8,power_law_1.01,0.059487998485565186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,4,power_law_1.2,0.25306239128112795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,8,power_law_1.01,0.060703998804092406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,4,power_law_1.2,0.3773632049560547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,8,power_law_1.01,0.061536002159118655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,4,power_law_1.2,0.47565441131591796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,8,power_law_1.01,0.07341439723968506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,4,power_law_1.2,0.570304012298584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,8,power_law_1.01,0.08078719973564148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,4,power_law_1.2,1.0851584434509278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,8,power_law_1.01,0.10208640098571778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,4,power_law_1.2,1.8345216751098632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,8,power_law_1.01,0.1336192011833191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,8,power_law_1.01,0.1827712059020996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,8,power_law_1.01,0.20427520275115968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,8,power_law_1.01,0.2876287937164307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,8,power_law_1.01,0.34067840576171876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,8,power_law_1.01,0.4948927879333496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,8,power_law_1.01,0.6409088134765625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,8,power_law_1.01,0.7818175792694092
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,8,8,power_law_1.2,0.35218560695648193
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,8,power_law_1.01,1.2850111961364745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,8,8,power_law_1.2,0.47649922370910647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,8,power_law_1.01,2.7267776489257813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,8,8,power_law_1.2,0.5669568061828614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,8,8,power_law_1.2,0.7919680118560791
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,8,8,power_law_1.2,1.0018112182617187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,8,8,power_law_1.2,1.3034751892089844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,8,8,power_law_1.2,2.0985151290893556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,8,power_law_1.2,0.03781760036945343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,8,power_law_1.2,0.03741439878940582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,8,8,power_law_1.2,3.949504089355469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,8,power_law_1.2,0.03802880048751831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,8,power_law_1.2,0.0343423992395401
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,8,power_law_1.2,0.03473919928073883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,8,power_law_1.2,0.03596799969673157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,8,power_law_1.2,0.03638400137424469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,8,power_law_1.2,0.03639039993286133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,8,power_law_1.2,0.038438400626182555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,8,power_law_1.2,0.03924480080604553
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,8,power_law_1.2,0.040479999780654904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,8,power_law_1.2,0.042124798893928526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,4,power_law_1.01,0.04002560079097748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,8,power_law_1.01,0.03919999897480011
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,8,power_law_1.2,0.043136000633239746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,4,power_law_1.01,0.03470079898834229
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,8,power_law_1.01,0.04595839977264404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,8,power_law_1.2,0.046828800439834596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,4,power_law_1.01,0.03429119884967804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,8,power_law_1.01,0.052102398872375486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,8,power_law_1.2,0.06219519972801209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,4,power_law_1.01,0.03532159924507141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,8,power_law_1.01,0.05249919891357422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,8,power_law_1.2,0.05727360248565674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,4,power_law_1.01,0.035724800825119016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,8,power_law_1.2,0.0720192015171051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,8,power_law_1.01,0.06806399822235107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,4,power_law_1.01,0.03653120100498199
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,8,power_law_1.2,0.09208319783210754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,8,power_law_1.01,0.07708160281181335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,4,power_law_1.01,0.03656319975852966
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,8,power_law_1.2,0.08267520070075988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,4,power_law_1.01,0.03777279853820801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,8,power_law_1.01,0.10450559854507446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,8,power_law_1.2,0.09823359847068787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,4,power_law_1.01,0.03777920007705689
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,8,power_law_1.01,0.0828224003314972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,4,power_law_1.2,0.03720319867134094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,4,power_law_1.01,0.03797119855880737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,8,power_law_1.2,0.14082560539245606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,8,power_law_1.01,0.10782719850540161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,4,power_law_1.2,0.03311359882354736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,4,power_law_1.01,0.041868799924850465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,8,power_law_1.2,0.18364160060882567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,8,power_law_1.01,0.12376960515975952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,4,power_law_1.01,0.042284798622131345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,4,power_law_1.2,0.03372800052165985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,8,power_law_1.2,0.1975551962852478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,8,power_law_1.01,0.19567359685897828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,4,power_law_1.01,0.04289920032024384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,4,power_law_1.2,0.035571199655532834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,8,power_law_1.2,0.2874752044677734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,8,power_law_1.01,0.19342080354690552
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,4,power_law_1.01,0.04474239945411682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,4,power_law_1.2,0.034534400701522826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,8,power_law_1.2,0.35422720909118655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,8,power_law_1.01,0.34025599956512453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,4,power_law_1.01,0.05251839756965637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,4,power_law_1.2,0.035359999537467955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,8,power_law_1.2,0.49738240242004395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,8,power_law_1.01,0.44408321380615234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,4,power_law_1.01,0.05948160290718078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,4,power_law_1.2,0.0355648010969162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,8,power_law_1.2,0.6001920223236084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,8,power_law_1.01,0.5481344223022461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,4,power_law_1.01,0.06419839859008789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,4,power_law_1.2,0.037625598907470706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,8,power_law_1.2,0.8527039527893067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,8,power_law_1.01,0.8756095886230468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,4,power_law_1.01,0.08220160007476807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,4,power_law_1.2,0.03863680064678192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,8,power_law_1.2,1.2936448097229003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,4,power_law_1.01,0.07544320225715637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,8,power_law_1.01,1.6964351654052734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,4,power_law_1.2,0.04007039964199066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,4,power_law_1.01,0.09571200013160705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,8,power_law_1.2,2.3805120468139647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,4,power_law_1.2,0.038438400626182555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,4,power_law_1.01,0.1213312029838562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,4,power_law_1.2,0.040479999780654904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,4,power_law_1.01,0.1485759973526001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,4,power_law_1.2,0.04294399917125702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,4,power_law_1.01,0.18481919765472413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,4,power_law_1.2,0.04479359984397888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,4,power_law_1.01,0.258950400352478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,4,power_law_1.2,0.053600001335144046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,4,power_law_1.01,0.3398591995239258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,4,power_law_1.2,0.05768960118293762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,4,power_law_1.01,0.43057918548583984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,4,power_law_1.2,0.06567680239677429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,4,power_law_1.01,0.5509823799133301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,4,power_law_1.2,0.08102399706840516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,4,power_law_1.01,0.770739221572876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,4,power_law_1.2,0.08349440097808838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,4,power_law_1.2,0.09679999947547913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,4,power_law_1.01,1.1387776374816894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,4,power_law_1.2,0.11871360540390015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,4,power_law_1.01,2.649990463256836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,4,power_law_1.2,0.1477311968803406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,4,power_law_1.2,0.17893120050430297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,4,power_law_1.2,0.21967999935150145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,4,power_law_1.2,0.29217278957366943
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,128,power_law_1.01,0.16412800550460815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,4,power_law_1.2,0.46953601837158204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,128,power_law_1.2,0.16376320123672486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,128,power_law_1.01,0.14999040365219116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,4,power_law_1.2,0.6868224143981934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,128,power_law_1.2,0.14882559776306153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,128,power_law_1.01,0.08814719915390015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,4,power_law_1.2,0.8072511672973632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,128,power_law_1.2,0.08635519742965699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,128,power_law_1.01,0.08650879859924317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,4,power_law_1.2,1.2776703834533691
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,128,power_law_1.2,0.09535999894142151
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,128,power_law_1.01,0.091839998960495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,4,power_law_1.2,3.0819583892822267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,128,power_law_1.2,0.08798720240592957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,128,power_law_1.01,0.08015999794006348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,128,power_law_1.2,0.07918720245361328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,128,power_law_1.01,0.08077440261840821
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,128,power_law_1.2,0.0798143982887268
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,128,power_law_1.01,0.0815999984741211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,128,power_law_1.2,0.08490880131721497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,128,power_law_1.01,0.08161280155181885
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,64,power_law_1.01,0.14958080053329467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,128,power_law_1.2,0.08471680283546448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,128,power_law_1.01,0.08384640216827392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,64,power_law_1.01,0.08980479836463928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,128,power_law_1.2,0.08654720187187195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,128,power_law_1.01,0.08936960101127625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,64,power_law_1.01,0.0689087986946106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,128,power_law_1.2,0.08881279826164246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,128,power_law_1.01,0.09080960154533387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,64,power_law_1.01,0.06111999750137329
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,128,power_law_1.2,0.09086719751358033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,128,power_law_1.01,0.09019520282745361
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,64,power_law_1.01,0.0680895984172821
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,128,power_law_1.2,0.09106559753417968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,128,power_law_1.01,0.08977919816970825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,64,power_law_1.01,0.07175679802894593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,128,power_law_1.2,0.09373440146446228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,128,power_law_1.01,0.09490560293197632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,64,power_law_1.01,0.07791360020637512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,128,power_law_1.2,0.10190720558166504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,128,power_law_1.01,0.09798399806022644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,64,power_law_1.2,0.15353599786758423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,64,power_law_1.01,0.08119680285453797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,128,power_law_1.2,0.10683519840240478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,128,power_law_1.01,0.10945279598236084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,64,power_law_1.2,0.08533759713172913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,64,power_law_1.01,0.08119680285453797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,128,power_law_1.2,0.12035839557647705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,128,power_law_1.01,0.1278656005859375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,64,power_law_1.2,0.0630079984664917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,64,power_law_1.01,0.08037760257720947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,128,power_law_1.2,0.13816959857940675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,128,power_law_1.01,0.1274623990058899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,64,power_law_1.2,0.06033920049667359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,64,power_law_1.01,0.0838591992855072
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,128,power_law_1.2,0.14124799966812135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,128,power_law_1.01,0.15286400318145751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,64,power_law_1.2,0.06464639902114869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,64,power_law_1.01,0.08365439772605895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,128,power_law_1.2,0.1848512053489685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,128,power_law_1.01,0.16780799627304077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,64,power_law_1.2,0.06873599886894226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,64,power_law_1.01,0.08364800214767457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,128,power_law_1.2,0.18302079439163207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,128,power_law_1.01,0.22556159496307374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,64,power_law_1.2,0.07550719976425171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,64,power_law_1.01,0.08774399757385254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,128,power_law_1.2,0.2602175951004028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,128,power_law_1.01,0.2677567958831787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,64,power_law_1.2,0.07715200185775757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,64,power_law_1.01,0.09715840220451355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,128,power_law_1.2,0.3190079927444458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,64,power_law_1.2,0.07570559978485107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,128,power_law_1.01,0.3228480100631714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,64,power_law_1.01,0.10207359790802002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,128,power_law_1.2,0.4609344005584717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,64,power_law_1.2,0.07735679745674133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,64,power_law_1.01,0.10739840269088745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,128,power_law_1.01,0.4887296199798584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,128,power_law_1.2,0.6458752155303955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,64,power_law_1.01,0.11681920289993286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,64,power_law_1.2,0.08206080198287964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,128,power_law_1.01,0.6818560123443603
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,128,power_law_1.2,0.9903424263000489
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,64,power_law_1.2,0.08267520070075988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,64,power_law_1.01,0.12174079418182374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,128,power_law_1.01,0.80513916015625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,128,power_law_1.2,1.1928895950317382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,64,power_law_1.2,0.08228480219841003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,64,power_law_1.01,0.14365439414978026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,128,power_law_1.01,1.0066752433776855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,128,power_law_1.2,1.6149696350097655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,64,power_law_1.2,0.08840960264205933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,64,power_law_1.01,0.15389440059661866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,128,power_law_1.01,1.5067904472351075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,128,power_law_1.2,2.832076835632324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,64,power_law_1.2,0.10232319831848144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,64,power_law_1.01,0.20571520328521728
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,64,power_law_1.2,0.10192639827728271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,64,power_law_1.01,0.23395841121673583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,128,power_law_1.01,3.0495424270629883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,128,power_law_1.2,6.10582389831543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,64,power_law_1.2,0.10438400506973267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,64,power_law_1.01,0.3115904092788696
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,64,power_law_1.2,0.12465280294418335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,64,power_law_1.01,0.38675200939178467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,64,power_law_1.2,0.13530880212783813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,64,power_law_1.01,0.5464896202087403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,64,power_law_1.2,0.19756799936294556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,64,power_law_1.01,0.7273471832275391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,64,power_law_1.2,0.17585920095443724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,64,power_law_1.01,0.8625023841857911
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,64,power_law_1.2,0.23813118934631347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,64,power_law_1.01,1.3054719924926759
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,64,power_law_1.2,0.2624768018722534
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,64,power_law_1.01,2.690540885925293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,64,power_law_1.2,0.3546560049057007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,64,power_law_1.2,0.4494016170501709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,64,power_law_1.2,0.7200064182281494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,64,power_law_1.2,0.8920448303222657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,32,power_law_1.01,0.10964479446411132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,32,power_law_1.2,0.09413759708404541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,64,power_law_1.2,1.2146112442016601
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,32,power_law_1.01,0.10658559799194336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,32,power_law_1.2,0.10231679677963257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,64,power_law_1.2,1.7444032669067382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,32,power_law_1.01,0.07217280268669128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,32,power_law_1.2,0.05113599896430969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,32,power_law_1.01,0.06152960062026978
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,32,power_law_1.2,0.05932160019874573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,64,power_law_1.2,3.931468963623047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,32,power_law_1.01,0.06807039976119995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,32,power_law_1.2,0.061977601051330565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,32,power_law_1.2,0.06627200245857238
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,32,power_law_1.01,0.07177600264549255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,32,power_law_1.2,0.07591040134429931
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,32,power_law_1.01,0.07544959783554077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,32,power_law_1.2,0.07898880243301391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,16,power_law_1.01,0.07996159791946411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,32,power_law_1.2,0.07919999957084656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,16,power_law_1.01,0.09696000218391418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,32,power_law_1.2,0.08062719702720642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,16,power_law_1.01,0.05578879714012146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,32,power_law_1.2,0.08327040076255798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,16,power_law_1.01,0.059487998485565186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,32,power_law_1.2,0.0830847978591919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,16,power_law_1.01,0.06481279730796814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,32,power_law_1.2,0.08471680283546448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,16,power_law_1.01,0.06929919719696045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,32,power_law_1.2,0.08799999952316284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,16,power_law_1.01,0.07914239764213563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,32,power_law_1.2,0.09290239810943604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,16,power_law_1.01,0.07934719920158387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,32,power_law_1.2,0.10191359519958496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,16,power_law_1.2,0.07447680234909057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,16,power_law_1.01,0.07996799945831298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,32,power_law_1.2,0.10765440464019775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,16,power_law_1.2,0.09168639779090881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,16,power_law_1.01,0.08200960159301758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,32,power_law_1.2,0.11725440025329589
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,16,power_law_1.2,0.05400320291519165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,16,power_law_1.01,0.08549759984016418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,32,power_law_1.2,0.12363519668579101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,16,power_law_1.2,0.05808640122413635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,16,power_law_1.01,0.08610560297966004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,32,power_law_1.2,0.1498304009437561
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,16,power_law_1.2,0.06219519972801209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,16,power_law_1.01,0.08609920144081115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,32,power_law_1.2,0.16785279512405396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,16,power_law_1.2,0.06813439726829529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,16,power_law_1.01,0.08979840278625488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,32,power_law_1.2,0.2065727949142456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,16,power_law_1.2,0.07694720029830933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,16,power_law_1.01,0.09449599981307984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,32,power_law_1.2,0.24487679004669188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,16,power_law_1.2,0.0787775993347168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,16,power_law_1.01,0.09879680275917054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,16,power_law_1.2,0.08021119832992554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,32,power_law_1.2,0.3566783905029297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,16,power_law_1.01,0.1033087968826294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,16,power_law_1.2,0.07836800217628478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,32,power_law_1.2,0.4103424072265625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,16,power_law_1.01,0.1205183982849121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,16,power_law_1.2,0.08288639783859253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,32,power_law_1.2,0.6548799991607666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,16,power_law_1.01,0.13341439962387086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,16,power_law_1.2,0.08697599768638611
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,32,power_law_1.2,0.8322303771972657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,16,power_law_1.01,0.15163520574569703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,16,power_law_1.2,0.08676480054855347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,32,power_law_1.2,0.996070384979248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,16,power_law_1.01,0.17007999420166015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,16,power_law_1.2,0.09106559753417968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,16,power_law_1.01,0.2085632085800171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,32,power_law_1.2,1.5490240097045898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,16,power_law_1.2,0.0949567973613739
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,16,power_law_1.01,0.25179519653320315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,16,power_law_1.2,0.09822720289230347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,32,power_law_1.2,3.294355010986328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,16,power_law_1.01,0.3261375904083252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,16,power_law_1.2,0.1076416015625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,16,power_law_1.01,0.4232128143310547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,16,power_law_1.2,0.12343039512634277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,16,power_law_1.2,0.13100800514221192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,16,power_law_1.01,0.5534592151641846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,16,power_law_1.2,0.16396160125732423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,16,power_law_1.01,0.6888319969177246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,16,power_law_1.2,0.17503999471664428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,16,power_law_1.01,0.8760255813598633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,16,power_law_1.2,0.21845760345458984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,16,power_law_1.01,1.4009087562561036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,16,power_law_1.2,0.2622720003128052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,16,power_law_1.01,2.6520383834838865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,16,power_law_1.2,0.3259711980819702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,16,power_law_1.2,0.4380032062530518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,16,power_law_1.2,0.6409599781036377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,16,power_law_1.2,0.7925119876861573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,16,power_law_1.2,1.0529472351074218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,16,power_law_1.2,1.4773568153381347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,8,power_law_1.01,0.05911039710044861
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,16,power_law_1.2,3.290662384033203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,8,power_law_1.01,0.06587520241737366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,8,power_law_1.01,0.055827200412750244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,8,power_law_1.01,0.058905601501464844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,8,power_law_1.01,0.06382719874382019
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,8,power_law_1.01,0.07264000177383423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,8,power_law_1.01,0.07775359749794006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,8,power_law_1.01,0.08183680176734924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,8,power_law_1.01,0.08367999792098998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,8,power_law_1.2,0.06848639845848084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,8,power_law_1.01,0.08595200181007386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,8,power_law_1.2,0.06645119786262513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,8,power_law_1.01,0.08881279826164246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,8,power_law_1.01,0.08921599984169007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,8,power_law_1.2,0.05539199709892273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,8,power_law_1.01,0.09105280041694641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,8,power_law_1.2,0.057843202352523805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,8,power_law_1.01,0.0933247983455658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,8,power_law_1.2,0.06234880089759827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,8,power_law_1.2,0.0680895984172821
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,8,power_law_1.01,0.09946240186691284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,8,power_law_1.2,0.07749760150909424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,8,power_law_1.01,0.1023360013961792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,8,power_law_1.2,0.08139520287513732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,8,power_law_1.01,0.10970879793167114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,8,power_law_1.2,0.08324480056762695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,8,power_law_1.01,0.1318079948425293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,8,power_law_1.2,0.08611199855804444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,8,power_law_1.01,0.14287359714508058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,4,power_law_1.01,0.05870720148086548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,8,power_law_1.2,0.08713600039482117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,8,power_law_1.01,0.16475520133972169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,4,power_law_1.01,0.06219519972801209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,8,power_law_1.2,0.0906175971031189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,8,power_law_1.01,0.1948799967765808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,4,power_law_1.01,0.055238401889801024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,8,power_law_1.01,0.2452608108520508
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,8,power_law_1.2,0.08979840278625488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,4,power_law_1.01,0.060550397634506224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,8,power_law_1.2,0.09552000164985656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,8,power_law_1.01,0.2964799880981445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,8,power_law_1.2,0.10126080513000488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,4,power_law_1.01,0.06669440269470214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,8,power_law_1.01,0.37489919662475585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,8,power_law_1.2,0.10699520111083985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,4,power_law_1.01,0.07305600047111512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,8,power_law_1.01,0.44700798988342283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,8,power_law_1.2,0.11703039407730102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,4,power_law_1.01,0.0834879994392395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,8,power_law_1.01,0.6329792022705079
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,8,power_law_1.2,0.13014400005340576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,4,power_law_1.01,0.08758400082588196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,8,power_law_1.01,0.8228032112121582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,8,power_law_1.2,0.15497599840164183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,4,power_law_1.01,0.09042559862136841
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,8,power_law_1.01,0.9649472236633301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,8,power_law_1.2,0.18339200019836427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,4,power_law_1.01,0.09331200122833253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,8,power_law_1.01,1.4933247566223145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,8,power_law_1.2,0.20446720123291015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,4,power_law_1.01,0.09598079919815064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,8,power_law_1.2,0.2536384105682373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,8,power_law_1.01,2.93450870513916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,4,power_law_1.01,0.09945600032806397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,8,power_law_1.2,0.3283776044845581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,4,power_law_1.01,0.10279680490493774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,4,power_law_1.01,0.10684159994125367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,8,power_law_1.2,0.42278399467468264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,4,power_law_1.01,0.11277439594268798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,8,power_law_1.2,0.5509952068328857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,4,power_law_1.01,0.11932799816131592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,8,power_law_1.2,0.7207871913909912
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,4,power_law_1.01,0.1256767988204956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,8,power_law_1.2,0.8681728363037109
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,4,power_law_1.01,0.146560001373291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,8,power_law_1.2,1.1477760314941405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,4,power_law_1.01,0.1666432023048401
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,8,power_law_1.2,1.6034559249877929
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,4,power_law_1.01,0.20760960578918458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,4,power_law_1.01,0.23955199718475342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,8,power_law_1.2,3.3069950103759767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,4,power_law_1.01,0.31921279430389404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,4,power_law_1.01,0.3759488105773926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,4,power_law_1.01,0.5055552005767823
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,4,power_law_1.01,0.6409599781036377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,4,power_law_1.01,0.8972991943359375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,4,power_law_1.01,1.0556672096252442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,4,power_law_1.01,1.3390527725219727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,4,power_law_1.2,0.05829120278358459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,4,power_law_1.01,2.131692886352539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,128,power_law_1.01,0.0361407995223999
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,4,power_law_1.2,0.061964797973632815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,128,power_law_1.01,0.03736959993839264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,4,power_law_1.2,0.05440639853477478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,4,power_law_1.01,4.127052688598633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,128,power_law_1.01,0.03490560054779053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,4,power_law_1.2,0.060127997398376466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,128,power_law_1.01,0.03633280098438263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,4,power_law_1.2,0.06547840237617493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,128,power_law_1.01,0.036339199542999266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,4,power_law_1.2,0.06997759938240052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,128,power_law_1.01,0.040031999349594116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,4,power_law_1.2,0.08533120155334473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,128,power_law_1.01,0.04105600118637085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,4,power_law_1.2,0.08778240084648133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,128,power_law_1.01,0.041465601325035094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,128,power_law_1.01,0.04678399860858917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,4,power_law_1.2,0.09004160165786743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,128,power_law_1.01,0.04780800044536591
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,4,power_law_1.2,0.09246079921722412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,128,power_law_1.01,0.052300798892974856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,4,power_law_1.2,0.0980288028717041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,128,power_law_1.01,0.05497599840164184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,128,power_law_1.2,0.033939200639724734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,4,power_law_1.2,0.09946240186691284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,128,power_law_1.01,0.056415998935699464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,128,power_law_1.2,0.034944000840187076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,4,power_law_1.2,0.1029312014579773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,128,power_law_1.01,0.041465601325035094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,128,power_law_1.2,0.033939200639724734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,4,power_law_1.2,0.1043776035308838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,128,power_law_1.01,0.047814399003982544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,128,power_law_1.2,0.03495680093765259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,4,power_law_1.2,0.11665920019149781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,128,power_law_1.01,0.05211520195007324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,128,power_law_1.2,0.035359999537467955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,32,power_law_1.01,0.07954559922218322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,128,power_law_1.01,0.05374720096588135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,4,power_law_1.2,0.11911040544509888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,128,power_law_1.2,0.03639039993286133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,128,power_law_1.01,0.06521599888801574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,32,power_law_1.01,0.08118399977684021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,128,power_law_1.2,0.03720319867134094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,4,power_law_1.2,0.1295680046081543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,128,power_law_1.01,0.07462400197982788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,32,power_law_1.01,0.0820032000541687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,128,power_law_1.2,0.046214398741722104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,4,power_law_1.2,0.149017596244812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,128,power_law_1.01,0.09757440090179444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,128,power_law_1.2,0.04642559885978699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,32,power_law_1.01,0.08609920144081115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,4,power_law_1.2,0.1691007971763611
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,128,power_law_1.01,0.09777920246124268
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,128,power_law_1.2,0.047251200675964354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,32,power_law_1.01,0.08630399703979492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,4,power_law_1.2,0.2100543975830078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,128,power_law_1.01,0.12379519939422608
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,128,power_law_1.2,0.054176002740859985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,32,power_law_1.01,0.08691840171813965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,4,power_law_1.2,0.24895360469818115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,128,power_law_1.01,0.13690240383148194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,128,power_law_1.2,0.055251199007034305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,32,power_law_1.01,0.08773120045661927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,4,power_law_1.2,0.31429119110107423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,128,power_law_1.01,0.2077631950378418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,128,power_law_1.2,0.05809280276298523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,32,power_law_1.01,0.09511039853096008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,128,power_law_1.01,0.24379520416259765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,4,power_law_1.2,0.40132479667663573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,128,power_law_1.2,0.04498560130596161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,32,power_law_1.01,0.09756159782409668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,128,power_law_1.01,0.37876479625701903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,128,power_law_1.2,0.05011839866638183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,4,power_law_1.2,0.5150015830993653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,32,power_law_1.01,0.10677759647369385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,128,power_law_1.2,0.05381119847297668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,128,power_law_1.01,0.4191103935241699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,4,power_law_1.2,0.6860159873962403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,128,power_law_1.2,0.06097279787063599
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,32,power_law_1.01,0.11538560390472412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,128,power_law_1.01,0.5145279884338378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,4,power_law_1.2,0.9329855918884278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,128,power_law_1.2,0.07283200025558471
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,32,power_law_1.01,0.11968640089035035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,128,power_law_1.01,1.0427519798278808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,4,power_law_1.2,1.136774444580078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,128,power_law_1.2,0.07756159901618957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,32,power_law_1.01,0.1389248013496399
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,128,power_law_1.01,1.9555135726928712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,4,power_law_1.2,1.4259519577026367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,128,power_law_1.2,0.09824640154838563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,32,power_law_1.01,0.15532159805297852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,128,power_law_1.2,0.12199039459228515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,4,power_law_1.2,2.3887039184570313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,32,power_law_1.01,0.19586559534072875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,128,power_law_1.2,0.16807039976119995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,32,power_law_1.01,0.22433919906616212
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,128,power_law_1.2,0.21989760398864747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,4,power_law_1.2,4.532345581054687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,32,power_law_1.01,0.2941632032394409
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,128,power_law_1.2,0.3513727903366089
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,32,power_law_1.01,0.3754944086074829
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,128,power_law_1.2,0.37592320442199706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,128,power_law_1.2,0.5666111946105957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,32,power_law_1.01,0.47643518447875977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,128,power_law_1.2,0.6802688121795655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,32,power_law_1.01,0.6929215908050537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,128,power_law_1.2,0.8670528411865235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,32,power_law_1.01,0.8629119873046875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,64,power_law_1.01,0.03449600040912628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,128,power_law_1.2,1.4210304260253905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,64,power_law_1.01,0.03324800133705139
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,32,power_law_1.01,1.2415679931640624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,64,power_law_1.01,0.033062401413917544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,128,power_law_1.2,2.7669824600219726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,32,power_law_1.01,2.4087295532226562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,64,power_law_1.01,0.03328000009059906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,64,power_law_1.2,0.032287999987602234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,64,power_law_1.01,0.033267199993133545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,64,power_law_1.2,0.031673601269721983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,64,power_law_1.01,0.03366400003433227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,64,power_law_1.2,0.03146879971027374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,64,power_law_1.01,0.03450239896774292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,64,power_law_1.2,0.032287999987602234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,64,power_law_1.01,0.039827200770378116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,64,power_law_1.2,0.032902398705482484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,64,power_law_1.01,0.042284798622131345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,64,power_law_1.2,0.033318400382995605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,64,power_law_1.01,0.044537600874900815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,64,power_law_1.2,0.03473919928073883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,64,power_law_1.01,0.04760960042476654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,64,power_law_1.2,0.0398719996213913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,64,power_law_1.01,0.05272960066795349
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,64,power_law_1.2,0.04416640102863312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,64,power_law_1.01,0.05334399938583374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,64,power_law_1.2,0.044582399725914004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,32,power_law_1.01,0.033497598767280576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,32,power_law_1.2,0.03407360017299652
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,64,power_law_1.01,0.04166400134563446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,64,power_law_1.2,0.04969600141048432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,32,power_law_1.01,0.03167999982833862
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,32,power_law_1.2,0.031001600623130798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,64,power_law_1.01,0.044940799474716187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,64,power_law_1.2,0.054611200094223024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,32,power_law_1.01,0.030649599432945252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,32,power_law_1.2,0.030803200602531434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,64,power_law_1.01,0.045561599731445315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,64,power_law_1.2,0.05603839755058289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,32,power_law_1.01,0.030457600951194763
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,32,power_law_1.2,0.03142400085926056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,64,power_law_1.01,0.04883840084075928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,64,power_law_1.2,0.04170239865779877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,32,power_law_1.2,0.0318336009979248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,64,power_law_1.01,0.061536002159118655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,64,power_law_1.2,0.045388799905776975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,32,power_law_1.2,0.03407999873161316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,64,power_law_1.2,0.047244799137115476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,32,power_law_1.2,0.03490560054779053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,64,power_law_1.2,0.05440639853477478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,32,power_law_1.2,0.03899520039558411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,64,power_law_1.2,0.06710399985313416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,32,power_law_1.2,0.04268800020217896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,64,power_law_1.2,0.07386879920959473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,32,power_law_1.2,0.045952001214027406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,64,power_law_1.2,0.09578239917755127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,64,power_law_1.2,0.12158080339431762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,32,power_law_1.2,0.05087360143661499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,32,power_law_1.2,0.05292159914970398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,64,power_law_1.2,0.15189119577407836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,32,power_law_1.2,0.05394560098648071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,64,power_law_1.2,0.16418559551239015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,32,power_law_1.2,0.040428799390792844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,64,power_law_1.2,0.22479360103607177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,32,power_law_1.2,0.04596480131149292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,64,power_law_1.2,0.24978559017181395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,32,power_law_1.2,0.04799999892711639
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,64,power_law_1.2,0.44864640235900877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,32,power_law_1.2,0.05004799962043762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,64,power_law_1.2,0.6014272212982178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,32,power_law_1.2,0.06234239935874939
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,64,power_law_1.2,0.7867712020874024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,32,power_law_1.2,0.0717631995677948
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,64,power_law_1.2,1.2637439727783204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,32,power_law_1.2,0.08588799834251404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,32,power_law_1.2,0.10985599756240845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,64,power_law_1.2,2.8501312255859377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,32,power_law_1.2,0.13320319652557372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,32,power_law_1.2,0.1356608033180237
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,32,power_law_1.2,0.1733440041542053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,32,power_law_1.2,0.25077760219573975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,32,power_law_1.2,0.48258562088012696
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,32,power_law_1.2,0.45800957679748533
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,32,power_law_1.2,0.5247807979583741
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,32,power_law_1.2,1.0024959564208984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,32,power_law_1.2,2.1027584075927734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,16,power_law_1.01,0.03473919928073883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,16,power_law_1.01,0.032492798566818235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,16,power_law_1.01,0.029824000597000123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,16,power_law_1.01,0.03146879971027374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,16,power_law_1.01,0.03227519989013672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,16,power_law_1.01,0.03392640054225922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,16,power_law_1.01,0.03433600068092346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,16,power_law_1.01,0.033529600501060484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,16,power_law_1.01,0.04085760116577149
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,16,power_law_1.01,0.04334079921245575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,16,power_law_1.01,0.04663040041923523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,16,power_law_1.2,0.034892800450325015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,16,power_law_1.2,0.030803200602531434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,16,power_law_1.2,0.030803200602531434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,16,power_law_1.2,0.03162240087985992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,16,power_law_1.2,0.03325439989566803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,16,power_law_1.2,0.034694400429725644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,16,power_law_1.2,0.035097599029541016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,16,power_law_1.2,0.040217599272727965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,16,power_law_1.2,0.04350079894065857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,16,power_law_1.2,0.045542401075363156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,16,power_law_1.2,0.05169919729232788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,16,power_law_1.2,0.053939199447631835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,16,power_law_1.2,0.05538560152053833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,16,power_law_1.2,0.040633600950241086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,16,power_law_1.2,0.04390400052070618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,16,power_law_1.2,0.04759039878845215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,16,power_law_1.2,0.05006080269813538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,16,power_law_1.2,0.0590719997882843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,16,power_law_1.2,0.06602879762649536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,16,power_law_1.2,0.08077440261840821
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,16,power_law_1.2,0.10002559423446655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,16,power_law_1.2,0.13299839496612548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,16,power_law_1.2,0.14016000032424927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,16,power_law_1.2,0.19155839681625367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,16,power_law_1.2,0.24768640995025634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,16,power_law_1.2,0.36113920211791994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,16,power_law_1.2,0.5112639904022217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,16,power_law_1.2,0.7027520179748535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,16,power_law_1.2,0.9808575630187988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,16,power_law_1.2,2.090265655517578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,8,power_law_1.01,0.03653120100498199
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,8,power_law_1.01,0.03163520097732544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,8,power_law_1.01,0.031615999341011045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,8,power_law_1.01,0.03244799971580505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,8,power_law_1.01,0.03408640027046204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,8,power_law_1.01,0.036934399604797365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,8,power_law_1.01,0.037350401282310486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,8,power_law_1.01,0.03919360041618347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,8,power_law_1.01,0.0398144006729126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,8,power_law_1.01,0.03979519903659821
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,8,power_law_1.01,0.04023039937019348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,8,power_law_1.01,0.040428799390792844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,8,power_law_1.01,0.0430976003408432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,8,power_law_1.01,0.043084800243377686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,8,power_law_1.01,0.04678399860858917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,8,power_law_1.01,0.05004799962043762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,8,power_law_1.01,0.05496960282325745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,8,power_law_1.01,0.06296319961547851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,8,power_law_1.01,0.0705344021320343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,8,power_law_1.01,0.08733440041542054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,8,power_law_1.01,0.09879040122032165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,8,power_law_1.01,0.129094398021698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,8,power_law_1.01,0.14466559886932373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,8,power_law_1.01,0.21452159881591798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,8,power_law_1.01,0.2603840112686157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,8,power_law_1.01,0.3398400068283081
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,8,power_law_1.01,0.44940800666809083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,8,power_law_1.01,0.5223231792449952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,8,power_law_1.01,0.9149184226989746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,8,power_law_1.01,1.7021696090698242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,32,power_law_1.01,0.032287999987602234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,32,power_law_1.01,0.03433600068092346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,8,power_law_1.2,0.03612799942493439
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,64,power_law_1.01,0.06665599942207337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,32,power_law_1.01,0.03516159951686859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,8,power_law_1.2,0.03141759932041168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,64,power_law_1.01,0.08896639943122864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,32,power_law_1.01,0.038841599225997926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,8,power_law_1.2,0.03160319924354553
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,64,power_law_1.01,0.09921280145645142
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,32,power_law_1.01,0.04314880073070526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,8,power_law_1.2,0.0328575998544693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,32,power_law_1.01,0.043558400869369504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,64,power_law_1.01,0.13813120126724243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,8,power_law_1.2,0.03429119884967804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,32,power_law_1.01,0.04519680142402649
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,64,power_law_1.01,0.12440320253372192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,8,power_law_1.2,0.03776000142097473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,32,power_law_1.01,0.05092480182647705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,8,power_law_1.2,0.038150399923324585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,64,power_law_1.01,0.1725376009941101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,32,power_law_1.01,0.05318400263786316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,8,power_law_1.2,0.03898879885673523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,64,power_law_1.01,0.1856384038925171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,32,power_law_1.01,0.03904640078544617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,8,power_law_1.2,0.03858560025691986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,64,power_law_1.01,0.2876159906387329
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,32,power_law_1.01,0.042534399032592776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,8,power_law_1.2,0.03940480053424835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,64,power_law_1.01,0.3486464023590088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,32,power_law_1.01,0.04540160000324249
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,8,power_law_1.2,0.03960959911346436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,64,power_law_1.01,0.45513601303100587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,32,power_law_1.01,0.04826239943504333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,8,power_law_1.2,0.04099839925765991
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,64,power_law_1.01,0.6826752185821533
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,32,power_law_1.01,0.052339202165603636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,8,power_law_1.2,0.04227199852466583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,32,power_law_1.01,0.06301440000534057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,8,power_law_1.2,0.04472959935665131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,64,power_law_1.01,1.433676815032959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,32,power_law_1.01,0.07980160117149353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,8,power_law_1.2,0.04840959906578064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,32,power_law_1.01,0.09107840061187744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,8,power_law_1.2,0.051481598615646364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,32,power_law_1.01,0.1283455967903137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,8,power_law_1.2,0.05621119737625122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,32,power_law_1.01,0.11626240015029907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,8,power_law_1.2,0.06273279786109924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,32,power_law_1.01,0.16376960277557373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,8,power_law_1.2,0.07871999740600585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,8,power_law_1.2,0.08691200017929077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,32,power_law_1.01,0.19367040395736695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,8,power_law_1.2,0.10699520111083985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,32,power_law_1.01,0.25388801097869873
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,8,power_law_1.2,0.13482880592346191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,32,power_law_1.01,0.3261823892593384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,8,power_law_1.2,0.17866239547729493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,32,power_law_1.01,0.4466047763824463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,8,power_law_1.2,0.28433918952941895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,32,power_law_1.01,0.6434175968170166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,8,power_law_1.2,0.28107519149780275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,32,power_law_1.01,1.1887935638427733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,8,power_law_1.2,0.4133440017700195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,8,power_law_1.2,0.5173952102661132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,4,power_law_1.01,0.03532159924507141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,4,power_law_1.01,0.03407999873161316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,8,power_law_1.2,0.6908671855926514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,4,power_law_1.01,0.03368319869041443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,8,power_law_1.2,1.071174430847168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,4,power_law_1.01,0.03552640080451965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,4,power_law_1.01,0.036134400963783266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,8,power_law_1.2,2.2004480361938477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,4,power_law_1.01,0.04104959964752197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,4,power_law_1.01,0.04104959964752197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,4,power_law_1.01,0.04227199852466583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,4,power_law_1.01,0.042284798622131345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,4,power_law_1.01,0.04227840006351471
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,4,power_law_1.01,0.04351359903812409
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,16,power_law_1.01,0.05112959742546082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,4,power_law_1.01,0.04535680115222931
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,16,power_law_1.01,0.05235840082168579
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,4,power_law_1.01,0.04595839977264404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,16,power_law_1.01,0.03966720104217529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,4,power_law_1.2,0.033523198962211606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,4,power_law_1.01,0.04863359928131104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,16,power_law_1.01,0.04293760061264038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,4,power_law_1.2,0.03086079955101013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,4,power_law_1.01,0.05375360250473023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,16,power_law_1.01,0.04559360146522522
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,4,power_law_1.2,0.033318400382995605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,4,power_law_1.01,0.05578879714012146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,16,power_law_1.01,0.04867199957370758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,4,power_law_1.2,0.033318400382995605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,4,power_law_1.01,0.06071680188179016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,16,power_law_1.01,0.05808640122413635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,4,power_law_1.2,0.03557760119438171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,4,power_law_1.01,0.07279360294342041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,16,power_law_1.01,0.06321920156478882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,32,power_law_1.01,0.07585279941558838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,4,power_law_1.2,0.040479999780654904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,4,power_law_1.01,0.0834496021270752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,16,power_law_1.01,0.07754240036010743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,4,power_law_1.2,0.042131200432777405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,32,power_law_1.01,0.076883202791214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,4,power_law_1.01,0.10556800365447998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,16,power_law_1.01,0.08533120155334473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,4,power_law_1.2,0.04110080003738403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,32,power_law_1.01,0.06377599835395813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,4,power_law_1.01,0.11518720388412476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,16,power_law_1.01,0.11052800416946411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,4,power_law_1.2,0.04232960045337677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,32,power_law_1.01,0.05783039927482605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,4,power_law_1.01,0.16311039924621581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,16,power_law_1.01,0.13694080114364623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,4,power_law_1.2,0.04276480078697205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,32,power_law_1.01,0.06314880251884461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,4,power_law_1.01,0.20039041042327882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,4,power_law_1.2,0.04356479942798615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,16,power_law_1.01,0.18097280263900756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,32,power_law_1.01,0.063155198097229
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,4,power_law_1.01,0.2657023906707764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,4,power_law_1.2,0.04376319944858551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,16,power_law_1.01,0.2028736114501953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,32,power_law_1.01,0.06663680076599121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,4,power_law_1.01,0.3380160093307495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,4,power_law_1.2,0.044377601146698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,16,power_law_1.01,0.30303359031677246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,32,power_law_1.01,0.0662335991859436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,4,power_law_1.01,0.47399039268493653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,4,power_law_1.2,0.0470335990190506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,32,power_law_1.01,0.06890239715576171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,16,power_law_1.01,0.3407167911529541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,4,power_law_1.01,0.6071231842041016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,4,power_law_1.2,0.053395199775695804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,32,power_law_1.01,0.07114239931106567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,16,power_law_1.01,0.46390399932861326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,4,power_law_1.2,0.055641597509384154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,4,power_law_1.01,0.7523071765899658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,32,power_law_1.01,0.07462400197982788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,16,power_law_1.01,0.770796823501587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,4,power_law_1.2,0.06218879818916321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,32,power_law_1.01,0.07585279941558838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,4,power_law_1.01,1.0969856262207032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,4,power_law_1.2,0.07326080203056336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,32,power_law_1.01,0.07790079712867737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,16,power_law_1.01,1.565004825592041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,4,power_law_1.01,2.2328128814697266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,4,power_law_1.2,0.08902400135993957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,32,power_law_1.01,0.07912319898605347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,4,power_law_1.2,0.1072383999824524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,32,power_law_1.01,0.08506879806518555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,4,power_law_1.2,0.13408000469207765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,32,power_law_1.01,0.08670719861984252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,4,power_law_1.2,0.17893120050430297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,32,power_law_1.01,0.09593600034713745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,4,power_law_1.2,0.2213184118270874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,32,power_law_1.01,0.10739200115203858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,4,power_law_1.2,0.2954623937606812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,32,power_law_1.01,0.11109119653701782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,4,power_law_1.2,0.3710207939147949
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,32,power_law_1.01,0.1393407940864563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,4,power_law_1.2,0.5494016170501709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,32,power_law_1.01,0.14139519929885863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,32,power_law_1.01,0.18645119667053223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,32,power_law_1.01,0.21327359676361085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,32,power_law_1.01,0.2632575988769531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,32,power_law_1.01,0.3445631980895996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,32,power_law_1.2,0.07057920098304749
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,32,power_law_1.01,0.4756351947784424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,16,power_law_1.01,0.07402240037918091
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,32,power_law_1.2,0.06670079827308655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,32,power_law_1.01,0.5943871974945069
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,16,power_law_1.01,0.07751039862632751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,32,power_law_1.2,0.06464639902114869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,32,power_law_1.01,0.7670464038848877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,16,power_law_1.01,0.06275839805603027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,32,power_law_1.2,0.05678079724311828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,32,power_law_1.01,1.371001625061035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,16,power_law_1.01,0.0574400007724762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,32,power_law_1.2,0.061363202333450315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,16,power_law_1.01,0.058873599767684935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,32,power_law_1.2,0.06504319906234741
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,32,power_law_1.01,2.5148223876953124
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,16,power_law_1.01,0.06848639845848084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,32,power_law_1.2,0.06506239771842956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,16,power_law_1.01,0.06849279999732971
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,32,power_law_1.2,0.06607999801635742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,32,power_law_1.2,0.06872959733009339
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,16,power_law_1.01,0.06911360025405884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,32,power_law_1.2,0.070387202501297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,16,power_law_1.01,0.06645119786262513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,32,power_law_1.2,0.07488639950752259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,16,power_law_1.01,0.07218559980392455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,32,power_law_1.2,0.07693439722061157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,16,power_law_1.01,0.07505279779434204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,32,power_law_1.2,0.07692800164222717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,32,power_law_1.2,0.07980160117149353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,32,power_law_1.2,0.08472319841384887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,32,power_law_1.2,0.09249920248985291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,32,power_law_1.2,0.09864959716796876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,32,power_law_1.2,0.11953920125961304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,32,power_law_1.2,0.13565440177917482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,32,power_law_1.2,0.1686784029006958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,16,power_law_1.2,0.07052800059318542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,32,power_law_1.2,0.15843839645385743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,16,power_law_1.2,0.06684160232543945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,32,power_law_1.2,0.21415040493011475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,16,power_law_1.2,0.05006080269813538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,32,power_law_1.2,0.2499903917312622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,16,power_law_1.2,0.05741440057754517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,16,power_law_1.2,0.05865600109100342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,32,power_law_1.2,0.3414655923843384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,16,power_law_1.2,0.0651968002319336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,32,power_law_1.2,0.4658495903015137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,16,power_law_1.2,0.06418560147285461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,32,power_law_1.2,0.575596809387207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,16,power_law_1.2,0.0664192020893097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,32,power_law_1.2,0.8739775657653809
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,16,power_law_1.2,0.06888960003852844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,32,power_law_1.2,1.243667221069336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,16,power_law_1.2,0.07196800112724304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,32,power_law_1.2,1.8828544616699219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,16,power_law_1.2,0.07504000067710877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,16,power_law_1.2,0.07626240253448487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,32,power_law_1.2,3.559968185424805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,16,power_law_1.2,0.07811840176582337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,16,power_law_1.2,0.08124160170555114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,16,power_law_1.2,0.08651520013809204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,16,power_law_1.2,0.08856319785118102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,16,power_law_1.2,0.09632639884948731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,16,power_law_1.2,0.10903680324554443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,16,power_law_1.2,0.1201024055480957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,16,power_law_1.2,0.14795520305633544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,16,power_law_1.2,0.15402239561080933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,16,power_law_1.2,0.196288001537323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,16,power_law_1.2,0.2567039966583252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,16,power_law_1.2,0.31445119380950926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,16,power_law_1.2,0.43999361991882324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,16,power_law_1.2,0.6337279796600341
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,16,power_law_1.2,0.9325311660766602
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,8,power_law_1.01,0.05644800066947937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,8,power_law_1.01,0.06096000075340271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,16,power_law_1.2,1.1133760452270507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,8,power_law_1.01,0.04947839975357056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,16,power_law_1.2,1.4476096153259277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,8,power_law_1.01,0.05685120224952698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,8,power_law_1.01,0.05973119735717773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,16,power_law_1.2,4.256447982788086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,8,power_law_1.01,0.0660863995552063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,8,power_law_1.01,0.07038080096244811
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,8,power_law_1.01,0.07080320119857789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,8,power_law_1.01,0.0723583996295929
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,8,power_law_1.01,0.07317759990692138
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,8,power_law_1.01,0.0770687997341156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,8,power_law_1.01,0.07857279777526856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,8,power_law_1.01,0.08123520016670227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,8,power_law_1.01,0.08184959888458251
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,8,power_law_1.01,0.09045760035514831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,8,power_law_1.01,0.0957759976387024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,8,power_law_1.01,0.09781759977340698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,8,power_law_1.01,0.11829119920730591
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,8,power_law_1.01,0.12935680150985718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,8,power_law_1.01,0.15557760000228882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,8,power_law_1.2,0.05742080211639404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,8,power_law_1.01,0.1699136018753052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,8,power_law_1.2,0.048204800486564635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,8,power_law_1.01,0.2067903995513916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,8,power_law_1.2,0.049235200881958006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,8,power_law_1.01,0.25960960388183596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,8,power_law_1.2,0.05457280278205871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,8,power_law_1.01,0.36440320014953614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,8,power_law_1.2,0.059059202671051025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,8,power_law_1.01,0.43267202377319336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,8,power_law_1.2,0.06602879762649536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,8,power_law_1.01,0.5879104137420654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,8,power_law_1.2,0.06807680130004883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,8,power_law_1.01,0.7597248077392578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,8,power_law_1.2,0.06991999745368957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,8,power_law_1.01,0.966163158416748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,8,power_law_1.2,0.07257599830627441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,8,power_law_1.01,1.3989312171936035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,8,power_law_1.2,0.07258880138397217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,8,power_law_1.2,0.07934079766273498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,8,power_law_1.01,2.694675254821777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,8,power_law_1.2,0.08179200291633607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,8,power_law_1.2,0.08158720135688782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,8,power_law_1.2,0.08691200017929077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,8,power_law_1.2,0.08958079814910888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,8,power_law_1.2,0.09572479724884034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,8,power_law_1.2,0.10615040063858032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,8,power_law_1.2,0.12378239631652832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,8,power_law_1.2,0.1340224027633667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,8,power_law_1.2,0.165555202960968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,8,power_law_1.2,0.1793984055519104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,8,power_law_1.2,0.23764479160308838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,8,power_law_1.2,0.30256640911102295
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,8,power_law_1.2,0.36871678829193116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,8,power_law_1.2,0.5104447841644287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,8,power_law_1.2,0.7822080135345459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,8,power_law_1.2,0.874783992767334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,8,power_law_1.2,1.260422420501709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,8,power_law_1.2,1.9534591674804687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,4,power_law_1.01,0.05562880039215088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,4,power_law_1.01,0.05317760109901428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,8,power_law_1.2,3.448691177368164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,4,power_law_1.01,0.0498879998922348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,4,power_law_1.01,0.058483201265335086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,4,power_law_1.01,0.06423680186271667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,4,power_law_1.01,0.07238399982452393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,4,power_law_1.01,0.07878400087356567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,4,power_law_1.01,0.07938560247421264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,4,power_law_1.01,0.08164479732513427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,4,power_law_1.01,0.0834879994392395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,4,power_law_1.01,0.08594560027122497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,4,power_law_1.01,0.09140480160713196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,4,power_law_1.01,0.092467200756073
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,4,power_law_1.01,0.09700480103492737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,4,power_law_1.01,0.10635520219802856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,4,power_law_1.01,0.10970879793167114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,4,power_law_1.01,0.11543040275573731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,4,power_law_1.2,0.6210944175720214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,4,power_law_1.01,0.13468799591064454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,4,power_law_1.2,0.8629568099975586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,4,power_law_1.01,0.14615679979324342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,4,power_law_1.2,1.450937557220459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,4,power_law_1.01,0.1899839997291565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,4,power_law_1.01,0.21946239471435547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,4,power_law_1.2,2.719264030456543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,4,power_law_1.2,0.056595200300216676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,4,power_law_1.01,0.2825536012649536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,4,power_law_1.2,0.05128960013389587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,4,power_law_1.01,0.31306240558624265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,4,power_law_1.2,0.05537279844284058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,4,power_law_1.01,0.44043521881103515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,4,power_law_1.2,0.05783039927482605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,4,power_law_1.01,0.5449024200439453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,4,power_law_1.2,0.06234239935874939
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,4,power_law_1.01,0.7785855770111084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,4,power_law_1.2,0.07585279941558838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,4,power_law_1.01,1.0556672096252442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,4,power_law_1.2,0.07872639894485474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,4,power_law_1.01,1.1674943923950196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,4,power_law_1.2,0.08323839902877808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,4,power_law_1.2,0.08610560297966004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,4,power_law_1.01,1.8303871154785156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,4,power_law_1.2,0.08650239706039428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,4,power_law_1.01,3.566304016113281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,4,power_law_1.2,0.09195520281791687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,4,power_law_1.2,0.0934719979763031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,4,power_law_1.2,0.09633920192718506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,16,power_law_1.01,0.07546240091323853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,128,power_law_1.01,0.11195520162582398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,4,power_law_1.2,0.09572479724884034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,16,power_law_1.01,0.07955200076103211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,128,power_law_1.01,0.15661439895629883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,16,power_law_1.01,0.07996799945831298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,4,power_law_1.2,0.10287359952926636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,128,power_law_1.01,0.09864320158958435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,16,power_law_1.01,0.08897280097007751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,4,power_law_1.2,0.1090432047843933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,16,power_law_1.01,0.08794879913330078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,4,power_law_1.2,0.12254719734191895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,128,power_law_1.01,0.09473279714584351
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,16,power_law_1.01,0.09612799882888794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,4,power_law_1.2,0.140774405002594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,128,power_law_1.01,0.08533759713172913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,16,power_law_1.01,0.10964479446411132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,4,power_law_1.2,0.15880320072174073
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,128,power_law_1.01,0.09434880018234253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,16,power_law_1.01,0.11720960140228272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,4,power_law_1.2,0.19585920572280885
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,128,power_law_1.01,0.09251840114593506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,16,power_law_1.01,0.14672640562057496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,4,power_law_1.2,0.22534399032592772
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,128,power_law_1.01,0.0886080026626587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,16,power_law_1.01,0.1518336057662964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,4,power_law_1.2,0.2976576089859009
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,128,power_law_1.01,0.09516800045967103
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,16,power_law_1.01,0.18523520231246948
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,4,power_law_1.2,0.3642175912857056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,128,power_law_1.2,0.15639679431915282
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,16,power_law_1.01,0.22392959594726564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,4,power_law_1.2,0.486681604385376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,128,power_law_1.01,0.09414399862289428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,128,power_law_1.2,0.11052800416946411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,16,power_law_1.01,0.2947776079177856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,128,power_law_1.01,0.09924479722976684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,4,power_law_1.2,0.6357823848724365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,128,power_law_1.2,0.09783040285110474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,16,power_law_1.01,0.3730175971984863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,4,power_law_1.2,0.8739583969116211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,128,power_law_1.01,0.10029439926147461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,128,power_law_1.2,0.08881919980049133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,16,power_law_1.01,0.5317376136779786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,128,power_law_1.01,0.09906560182571411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,4,power_law_1.2,1.005452823638916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,128,power_law_1.2,0.09371520280838012
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,16,power_law_1.01,0.6851456165313721
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,128,power_law_1.01,0.10192639827728271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,4,power_law_1.2,1.3910719871520996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,128,power_law_1.2,0.08756480216979981
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,16,power_law_1.01,0.731001615524292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,128,power_law_1.01,0.10191999673843384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,4,power_law_1.2,1.9243776321411132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,128,power_law_1.2,0.08983039855957031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,128,power_law_1.01,0.10684159994125367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,16,power_law_1.01,1.250175952911377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,4,power_law_1.2,3.935103988647461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,128,power_law_1.2,0.08881919980049133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,128,power_law_1.01,0.1224128007888794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,16,power_law_1.01,3.00817928314209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,128,power_law_1.2,0.0949504017829895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,128,power_law_1.01,0.13468159437179567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,128,power_law_1.2,0.08961920142173767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,128,power_law_1.01,0.14635519981384276
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,128,power_law_1.2,0.09659519791603088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,128,power_law_1.01,0.17688319683074952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,128,power_law_1.01,0.18547199964523314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,128,power_law_1.2,0.09945600032806397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,128,power_law_1.01,0.23709440231323242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,128,power_law_1.2,0.09904000163078308
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,128,power_law_1.01,0.29054720401763917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,128,power_law_1.2,0.10028799772262573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,128,power_law_1.01,0.37839999198913576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,128,power_law_1.2,0.10481280088424683
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,128,power_law_1.01,0.4801919937133789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,128,power_law_1.2,0.11831040382385254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,128,power_law_1.2,0.12239999771118164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,128,power_law_1.01,0.6280704021453858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,128,power_law_1.2,0.14778239727020265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,128,power_law_1.01,0.8285440444946289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,64,power_law_1.01,0.2040640115737915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,128,power_law_1.2,0.15640319585800172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,64,power_law_1.2,0.10577280521392822
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,64,power_law_1.01,0.09962239861488342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,128,power_law_1.01,1.0079615592956543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,64,power_law_1.2,0.10003839731216431
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,128,power_law_1.2,0.20151679515838622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,64,power_law_1.01,0.09429759979248047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,128,power_law_1.01,1.5821951866149901
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,64,power_law_1.2,0.09593600034713745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,128,power_law_1.2,0.19898879528045654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,64,power_law_1.01,0.0680895984172821
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,128,power_law_1.01,3.338163375854492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,64,power_law_1.2,0.07052159905433655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,128,power_law_1.2,0.27803521156311034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,64,power_law_1.01,0.0717631995677948
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,64,power_law_1.2,0.07710080146789551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,128,power_law_1.2,0.30385279655456543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,64,power_law_1.01,0.0840448021888733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,64,power_law_1.2,0.07853440046310425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,64,power_law_1.01,0.08731520175933838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,128,power_law_1.2,0.4564223766326904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,64,power_law_1.2,0.08283519744873047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,64,power_law_1.01,0.08652160167694092
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,128,power_law_1.2,0.5444736003875732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,64,power_law_1.2,0.0893887996673584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,64,power_law_1.01,0.08936960101127625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,128,power_law_1.2,0.7765376091003418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,64,power_law_1.2,0.09430400133132935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,64,power_law_1.01,0.08773120045661927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,128,power_law_1.2,1.1142463684082031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,64,power_law_1.2,0.09592959880828858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,64,power_law_1.01,0.0934656023979187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,128,power_law_1.2,1.4361791610717773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,64,power_law_1.2,0.09327999949455261
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,64,power_law_1.01,0.09387519955635071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,128,power_law_1.2,2.131679916381836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,64,power_law_1.2,0.09307519793510437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,64,power_law_1.01,0.09919999837875366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,64,power_law_1.2,0.09285759925842285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,64,power_law_1.01,0.09838719964027405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,128,power_law_1.2,4.53111686706543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,64,power_law_1.2,0.10106240510940552
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,64,power_law_1.01,0.10617599487304688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,32,power_law_1.01,0.09434239864349366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,64,power_law_1.01,0.11128319501876831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,32,power_law_1.01,0.10192639827728271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,64,power_law_1.01,0.11743359565734864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,32,power_law_1.01,0.09496319890022278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,64,power_law_1.01,0.1378432035446167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,32,power_law_1.01,0.061343997716903687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,64,power_law_1.01,0.13954559564590455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,32,power_law_1.01,0.0662335991859436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,64,power_law_1.01,0.15735679864883423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,32,power_law_1.01,0.07325440049171447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,64,power_law_1.01,0.17968640327453614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,32,power_law_1.01,0.07815679907798767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,64,power_law_1.01,0.22310400009155273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,64,power_law_1.01,0.2552704095840454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,64,power_law_1.01,0.34110078811645506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,32,power_law_1.2,0.10805120468139648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,64,power_law_1.01,0.43425917625427246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,32,power_law_1.2,0.10232959985733033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,64,power_law_1.01,0.62391037940979
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,32,power_law_1.2,0.08511360287666321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,64,power_law_1.01,0.7306111812591553
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,32,power_law_1.2,0.05870720148086548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,64,power_law_1.01,0.9108415603637695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,32,power_law_1.2,0.06937599778175355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,64,power_law_1.01,1.4193344116210938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,32,power_law_1.2,0.07304319739341736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,32,power_law_1.2,0.07447680234909057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,64,power_law_1.01,2.6749696731567383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,32,power_law_1.2,0.08636159896850586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,32,power_law_1.2,0.08306559920310974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,32,power_law_1.2,0.09004799723625183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,32,power_law_1.2,0.09004160165786743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,32,power_law_1.2,0.09741439819335937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,32,power_law_1.2,0.09168000221252441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,32,power_law_1.2,0.09463679790496826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,32,power_law_1.2,0.10314240455627441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,32,power_law_1.2,0.10682879686355591
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,32,power_law_1.2,0.11256959438323974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,32,power_law_1.2,0.13960319757461548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,32,power_law_1.2,0.15107200145721436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,16,power_law_1.01,0.07912960052490234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,32,power_law_1.2,0.18424960374832153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,16,power_law_1.01,0.0955136001110077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,32,power_law_1.2,0.1801535964012146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,16,power_law_1.01,0.11885440349578857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,32,power_law_1.2,0.23299200534820558
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,16,power_law_1.01,0.0615231990814209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,32,power_law_1.2,0.2710848093032837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,16,power_law_1.01,0.06480000019073487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,32,power_law_1.2,0.35834240913391113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,16,power_law_1.01,0.0729856014251709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,32,power_law_1.2,0.43921918869018556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,16,power_law_1.01,0.07709439992904663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,32,power_law_1.2,0.6239168167114257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,16,power_law_1.01,0.08814079761505127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,32,power_law_1.2,0.8813823699951172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,16,power_law_1.01,0.0906112015247345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,32,power_law_1.2,1.0071295738220214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,16,power_law_1.01,0.09141759872436524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,32,power_law_1.2,1.531827163696289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,16,power_law_1.01,0.09224320054054261
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,16,power_law_1.01,0.09735680222511292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,32,power_law_1.2,3.4683582305908205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,16,power_law_1.01,0.09755520224571228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,16,power_law_1.01,0.10206719636917114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,16,power_law_1.01,0.1082111954689026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,16,power_law_1.01,0.10986239910125732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,16,power_law_1.01,0.11578880548477173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,16,power_law_1.01,0.1258239984512329
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,16,power_law_1.01,0.13893760442733766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,16,power_law_1.01,0.17415679693222047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,16,power_law_1.01,0.1913599967956543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,16,power_law_1.01,0.23355519771575928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,16,power_law_1.01,0.27799038887023925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,16,power_law_1.01,0.34325759410858153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,16,power_law_1.01,0.4449024200439453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,16,power_law_1.2,0.07529600262641907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,16,power_law_1.2,0.09004799723625183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,16,power_law_1.01,0.5935999870300293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,16,power_law_1.2,0.07385600209236146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,16,power_law_1.01,0.7776639938354493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,16,power_law_1.2,0.059935998916625974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,16,power_law_1.01,0.8928000450134277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,16,power_law_1.2,0.06546559929847717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,16,power_law_1.01,1.401318359375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,16,power_law_1.2,0.06970239877700805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,16,power_law_1.2,0.07447680234909057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,16,power_law_1.01,2.720025634765625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,16,power_law_1.2,0.08758400082588196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,16,power_law_1.2,0.08922240138053894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,16,power_law_1.2,0.09291520118713378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,16,power_law_1.2,0.09290879964828491
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,16,power_law_1.2,0.09781759977340698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,16,power_law_1.2,0.09804159998893738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,16,power_law_1.2,0.10109440088272095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,16,power_law_1.2,0.10560640096664428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,16,power_law_1.2,0.11297919750213622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,16,power_law_1.2,0.11584639549255371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,16,power_law_1.2,0.134278404712677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,16,power_law_1.2,0.14759039878845215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,16,power_law_1.2,0.18220160007476807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,16,power_law_1.2,0.19899519681930541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,8,power_law_1.01,0.06069759726524353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,16,power_law_1.2,0.2359935998916626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,8,power_law_1.01,0.06725760102272034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,16,power_law_1.2,0.2829632043838501
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,8,power_law_1.01,0.09182720184326172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,16,power_law_1.2,0.359116792678833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,8,power_law_1.01,0.058246397972106935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,16,power_law_1.2,0.48510079383850097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,8,power_law_1.01,0.06685439944267273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,16,power_law_1.2,0.7150847911834717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,8,power_law_1.01,0.07462400197982788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,16,power_law_1.2,0.8471232414245605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,8,power_law_1.01,0.08056319952011108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,16,power_law_1.2,1.0675456047058105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,8,power_law_1.01,0.09205120205879211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,16,power_law_1.2,1.6829439163208009
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,8,power_law_1.01,0.09472000002861022
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,8,power_law_1.01,0.09653760194778442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,16,power_law_1.2,3.248876953125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,8,power_law_1.01,0.09919360280036926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,8,power_law_1.01,0.10057599544525146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,8,power_law_1.01,0.10203520059585572
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,8,power_law_1.01,0.10616320371627808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,8,power_law_1.01,0.11232000589370728
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,8,power_law_1.01,0.11818239688873292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,8,power_law_1.01,0.12543359994888306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,8,power_law_1.01,0.13894399404525756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,8,power_law_1.01,0.1526528000831604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,8,power_law_1.01,0.19710079431533814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,8,power_law_1.01,0.20938880443573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,8,power_law_1.01,0.27000319957733154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,64,power_law_1.2,0.10657279491424561
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,8,power_law_1.01,0.3291968107223511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,64,power_law_1.2,0.10536320209503174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,8,power_law_1.01,0.42318081855773926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,8,power_law_1.2,0.05973119735717773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,64,power_law_1.2,0.11130239963531494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,8,power_law_1.01,0.5268288135528565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,8,power_law_1.2,0.06607999801635742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,64,power_law_1.2,0.1264575958251953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,8,power_law_1.01,0.7543551921844482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,8,power_law_1.2,0.060140800476074216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,64,power_law_1.2,0.14856319427490233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,8,power_law_1.01,0.8915648460388184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,8,power_law_1.2,0.057894402742385866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,64,power_law_1.2,0.1725376009941101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,8,power_law_1.01,1.0842944145202638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,8,power_law_1.2,0.0642304003238678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,64,power_law_1.2,0.20202879905700682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,8,power_law_1.2,0.06956160068511963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,64,power_law_1.2,0.24769279956817628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,8,power_law_1.01,1.6501567840576172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,32,power_law_1.01,0.08405759930610657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,8,power_law_1.2,0.07775359749794006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,64,power_law_1.2,0.27307519912719724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,32,power_law_1.01,0.08492159843444824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,8,power_law_1.01,3.2688961029052734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,8,power_law_1.2,0.08758400082588196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,64,power_law_1.2,0.39738879203796384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,32,power_law_1.01,0.08799359798431397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,8,power_law_1.2,0.09004160165786743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,64,power_law_1.2,0.47808637619018557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,32,power_law_1.01,0.09168000221252441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,8,power_law_1.2,0.09475839734077454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,64,power_law_1.2,0.6962111949920654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,32,power_law_1.01,0.0933184027671814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,8,power_law_1.2,0.09662719964981079
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,64,power_law_1.2,0.9411328315734864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,32,power_law_1.01,0.09516159892082214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,8,power_law_1.2,0.09824000000953674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,32,power_law_1.01,0.09845119714736938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,64,power_law_1.2,1.129747200012207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,8,power_law_1.2,0.09966719746589661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,32,power_law_1.01,0.10643199682235718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,64,power_law_1.2,1.6698112487792969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,8,power_law_1.2,0.10622719526290894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,32,power_law_1.01,0.10928640365600586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,8,power_law_1.2,0.11644799709320068
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,64,power_law_1.2,4.066790390014648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,32,power_law_1.01,0.11051520109176635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,8,power_law_1.2,0.12035200595855713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,32,power_law_1.01,0.12362879514694214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,8,power_law_1.2,0.125273597240448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,32,power_law_1.01,0.1416383981704712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,8,power_law_1.2,0.14533120393753052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,32,power_law_1.01,0.17052160501480101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,8,power_law_1.2,0.1596735954284668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,32,power_law_1.01,0.18302079439163207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,8,power_law_1.2,0.19326080083847047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,32,power_law_1.01,0.21169919967651368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,8,power_law_1.2,0.21987199783325195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,32,power_law_1.01,0.24650239944458008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,8,power_law_1.2,0.2886784076690674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,32,power_law_1.01,0.3161535978317261
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,8,power_law_1.2,0.33087360858917236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,4,power_law_1.01,0.060288000106811526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,32,power_law_1.01,0.4217984199523926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,8,power_law_1.2,0.4547776222229004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,4,power_law_1.01,0.06438400149345398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,8,power_law_1.2,0.561683177947998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,4,power_law_1.01,0.07462400197982788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,8,power_law_1.2,0.7818560123443603
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,4,power_law_1.01,0.06172800064086914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,8,power_law_1.2,0.9366847991943359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,4,power_law_1.01,0.06828160285949707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,8,power_law_1.2,1.2358976364135743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,4,power_law_1.01,0.08138880133628845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,4,power_law_1.01,0.08568959832191467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,8,power_law_1.2,1.7739072799682618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,4,power_law_1.01,0.09960319995880126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,8,power_law_1.2,3.645158386230469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,4,power_law_1.2,0.0621504008769989
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,4,power_law_1.01,0.10432000160217285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,4,power_law_1.2,0.0652288019657135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,4,power_law_1.01,0.10616320371627808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,4,power_law_1.2,0.06563199758529663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,4,power_law_1.01,0.11455999612808228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,4,power_law_1.2,0.06439039707183838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,4,power_law_1.01,0.11969280242919922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,4,power_law_1.2,0.0713599979877472
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,4,power_law_1.01,0.1192896008491516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,8,power_law_1.01,0.03144319951534271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,4,power_law_1.2,0.07627519965171814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,4,power_law_1.01,0.1229632019996643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,8,power_law_1.01,0.035980799794197084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,4,power_law_1.01,0.13116159439086914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,4,power_law_1.2,0.08611199855804444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,8,power_law_1.01,0.032076799869537355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,8,power_law_1.01,0.03126400113105774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,4,power_law_1.01,0.1340224027633667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,4,power_law_1.2,0.09676799774169922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,8,power_law_1.01,0.031673601269721983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,4,power_law_1.2,0.1004480004310608
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,4,power_law_1.01,0.14303359985351563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,8,power_law_1.01,0.03372159898281098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,8,power_law_1.01,0.03413119912147522
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,4,power_law_1.2,0.10454399585723877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,4,power_law_1.01,0.16637439727783204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,8,power_law_1.01,0.03372159898281098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,4,power_law_1.2,0.10863360166549682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,4,power_law_1.01,0.18789119720458985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,8,power_law_1.01,0.03454720079898834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,8,power_law_1.01,0.034745600819587705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,4,power_law_1.2,0.11355520486831665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,4,power_law_1.01,0.2323199987411499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,8,power_law_1.01,0.035769599676132205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,4,power_law_1.2,0.11662720441818238
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,8,power_law_1.01,0.03720960021018982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,4,power_law_1.01,0.2581376075744629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,8,power_law_1.01,0.03699840009212494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,4,power_law_1.2,0.12584320306777955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,4,power_law_1.01,0.3439487934112549
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,8,power_law_1.01,0.04252800047397613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,4,power_law_1.2,0.13137279748916625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,8,power_law_1.01,0.047654399275779726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,4,power_law_1.01,0.4621119976043701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,8,power_law_1.01,0.05072000026702881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,4,power_law_1.2,0.1371072053909302
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,4,power_law_1.01,0.5878399848937989
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,8,power_law_1.01,0.04826239943504333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,8,power_law_1.01,0.05358080267906189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,4,power_law_1.2,0.14773759841918946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,4,power_law_1.01,0.7113408088684082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,8,power_law_1.01,0.05912320017814636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,4,power_law_1.2,0.16966400146484376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,8,power_law_1.01,0.07365760207176208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,8,power_law_1.01,0.08472319841384887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,4,power_law_1.2,0.18892159461975097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,8,power_law_1.01,0.12117120027542114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,4,power_law_1.2,0.23971199989318848
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,8,power_law_1.01,0.14124159812927245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,8,power_law_1.01,0.19480960369110106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,8,power_law_1.01,0.25347199440002444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,8,power_law_1.01,0.36734719276428224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,8,power_law_1.01,0.4596992015838623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,8,power_law_1.01,0.5555456161499024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,8,power_law_1.01,0.8858176231384277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,8,power_law_1.01,1.7939264297485351
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,8,power_law_1.2,0.03269760012626648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,8,power_law_1.2,0.034764799475669864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,8,power_law_1.2,0.03187839984893799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,8,power_law_1.2,0.03146879971027374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,8,power_law_1.2,0.03167999982833862
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,8,power_law_1.2,0.03351680040359497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,8,power_law_1.2,0.035155200958251955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,8,power_law_1.2,0.0343423992395401
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,8,power_law_1.2,0.03434880077838898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,8,power_law_1.2,0.0343423992395401
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,8,power_law_1.2,0.035980799794197084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,8,power_law_1.2,0.03720319867134094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,8,power_law_1.2,0.03761279881000519
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,8,power_law_1.2,0.03842560052871704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,8,power_law_1.2,0.043756800889968875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,8,power_law_1.2,0.0470335990190506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,8,power_law_1.2,0.04863359928131104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,8,power_law_1.2,0.05727360248565674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,8,power_law_1.2,0.058911997079849246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,8,power_law_1.2,0.0744704008102417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,8,power_law_1.2,0.08389760255813598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,8,power_law_1.2,0.12035200595855713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,8,power_law_1.2,0.14043519496917725
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,8,power_law_1.2,0.19981440305709838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,8,power_law_1.2,0.25756158828735354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,8,power_law_1.2,0.3762943983078003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,8,power_law_1.2,0.4478271961212158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,8,power_law_1.2,0.5899648189544677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,8,power_law_1.2,0.9436479568481445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,8,power_law_1.2,1.813222312927246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,4,power_law_1.01,0.032691198587417605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,4,power_law_1.01,0.033107200264930726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,4,power_law_1.01,0.03391999900341034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,4,power_law_1.01,0.03223040103912354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,4,power_law_1.01,0.032691198587417605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,4,power_law_1.01,0.03475840091705322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,4,power_law_1.01,0.03473919928073883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,4,power_law_1.01,0.0355648010969162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,4,power_law_1.01,0.0355648010969162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,4,power_law_1.01,0.036287999153137206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,4,power_law_1.01,0.03638400137424469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,4,power_law_1.01,0.03741439878940582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,4,power_law_1.01,0.03720319867134094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,4,power_law_1.01,0.040064001083374025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,4,power_law_1.01,0.044582399725914004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,4,power_law_1.01,0.04498560130596161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,4,power_law_1.01,0.049491199851036075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,4,power_law_1.01,0.054816001653671266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,4,power_law_1.01,0.057196801900863646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,4,power_law_1.01,0.07529600262641907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,4,power_law_1.01,0.09556480050086975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,4,power_law_1.01,0.12117120027542114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,4,power_law_1.01,0.1432960033416748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,4,power_law_1.01,0.20432000160217284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,4,power_law_1.01,0.23832321166992188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,4,power_law_1.01,0.3788032054901123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,4,power_law_1.01,0.43840641975402833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,4,power_law_1.01,0.6372352123260498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,4,power_law_1.01,0.9207103729248047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,4,power_law_1.01,1.8451007843017577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,4,power_law_1.2,0.03351680040359497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,4,power_law_1.2,0.032678401470184325
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,4,power_law_1.2,0.032595199346542356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,4,power_law_1.2,0.03221760094165802
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,4,power_law_1.2,0.033471998572349546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,4,power_law_1.2,0.034745600819587705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,4,power_law_1.2,0.03434880077838898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,4,power_law_1.2,0.035155200958251955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,4,power_law_1.2,0.03535360097885132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,4,power_law_1.2,0.036800000071525577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,4,power_law_1.2,0.03681280016899109
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,4,power_law_1.2,0.03761920034885406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,32,power_law_1.01,0.58504319190979
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,4,power_law_1.2,0.03760640025138855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,4,power_law_1.2,0.038848000764846805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,32,power_law_1.01,0.7544064044952392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,4,power_law_1.2,0.04477440118789673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,32,power_law_1.01,0.8940928459167481
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,4,power_law_1.2,0.04577920138835907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,4,power_law_1.2,0.05235199928283692
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,32,power_law_1.01,1.353452777862549
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,4,power_law_1.2,0.05727360248565674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,4,power_law_1.2,0.0646399974822998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,4,power_law_1.2,0.07816960215568543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,32,power_law_1.01,2.5603456497192383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,4,power_law_1.2,0.09303680062294006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,4,power_law_1.2,0.13222399950027466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,4,power_law_1.2,0.16663680076599122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,4,power_law_1.2,0.22069759368896485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,4,power_law_1.2,0.2895040035247803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,4,power_law_1.2,0.40229120254516604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,4,power_law_1.2,0.5117119789123535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,4,power_law_1.2,0.6622528076171875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,4,power_law_1.2,1.0001728057861328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,8,power_law_1.01,0.033913600444793704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,4,power_law_1.2,1.9620479583740233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,8,power_law_1.01,0.03516159951686859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,8,power_law_1.01,0.03473919928073883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,8,power_law_1.01,0.033932799100875856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,8,power_law_1.01,0.03495680093765259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,8,power_law_1.01,0.035980799794197084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,8,power_law_1.01,0.0380160003900528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,8,power_law_1.01,0.03720960021018982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,8,power_law_1.01,0.03781760036945343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,8,power_law_1.01,0.03960959911346436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,8,power_law_1.01,0.04046719968318939
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,8,power_law_1.2,0.03637759983539581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,8,power_law_1.01,0.041920000314712526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,8,power_law_1.2,0.0355648010969162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,8,power_law_1.01,0.046214398741722104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,8,power_law_1.2,0.03426559865474701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,8,power_law_1.01,0.042534399032592776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,8,power_law_1.2,0.034745600819587705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,8,power_law_1.01,0.04847359955310822
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,8,power_law_1.2,0.0343423992395401
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,8,power_law_1.01,0.05256959795951843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,8,power_law_1.2,0.03535360097885132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,8,power_law_1.01,0.056857597827911374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,8,power_law_1.2,0.035980799794197084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,8,power_law_1.01,0.06567680239677429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,8,power_law_1.2,0.035769599676132205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,8,power_law_1.01,0.07427200078964233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,8,power_law_1.2,0.03637759983539581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,8,power_law_1.01,0.09578239917755127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,8,power_law_1.2,0.038227200508117676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,8,power_law_1.01,0.11584639549255371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,8,power_law_1.2,0.037811198830604555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,8,power_law_1.01,0.16357120275497436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,8,power_law_1.2,0.04089600145816803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,4,power_law_1.01,0.9829055786132812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,8,power_law_1.01,0.19141119718551636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,8,power_law_1.2,0.04088320136070252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,8,power_law_1.01,0.26963200569152834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,4,power_law_1.01,1.2026559829711914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,8,power_law_1.2,0.04170239865779877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,8,power_law_1.01,0.3237056016921997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,8,power_law_1.2,0.04987519979476929
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,4,power_law_1.01,1.5239808082580566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,8,power_law_1.01,0.4920703887939453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,8,power_law_1.2,0.05111680030822754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,4,power_law_1.2,0.2827199935913086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,8,power_law_1.01,0.6479231834411621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,8,power_law_1.2,0.05686399936676025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,4,power_law_1.01,2.2442815780639647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,4,power_law_1.2,0.3465984106063843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,8,power_law_1.01,0.7757247924804688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,8,power_law_1.2,0.06710399985313416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,8,power_law_1.2,0.07488639950752259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,8,power_law_1.01,1.281766414642334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,4,power_law_1.2,0.49528961181640624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,4,power_law_1.01,4.162630462646485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,8,power_law_1.2,0.09453439712524414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,8,power_law_1.01,2.4706304550170897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,4,power_law_1.2,0.6087423801422119
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,8,power_law_1.2,0.13100800514221192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,8,power_law_1.2,0.1668287992477417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,4,power_law_1.2,0.720358419418335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,8,power_law_1.2,0.20103039741516113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,8,power_law_1.2,0.27306880950927737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,4,power_law_1.2,1.0564352035522462
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,8,power_law_1.2,0.3513535976409912
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,4,power_law_1.2,1.2559103965759277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,8,power_law_1.2,0.5182720184326172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,8,power_law_1.2,0.6433919906616211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,4,power_law_1.2,1.630086326599121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,8,power_law_1.2,0.813811206817627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,4,power_law_1.01,0.03633280098438263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,4,power_law_1.2,2.468537521362305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,8,power_law_1.2,1.2457216262817383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,4,power_law_1.2,0.038431999087333676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,4,power_law_1.01,0.03489919900894165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,8,power_law_1.2,2.5980159759521486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,4,power_law_1.2,0.036396801471710205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,4,power_law_1.01,0.03531520068645477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,4,power_law_1.2,4.861427307128906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,4,power_law_1.2,0.035571199655532834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,4,power_law_1.01,0.03550719916820526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,4,power_law_1.2,0.0355648010969162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,4,power_law_1.01,0.035718399286270144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,4,power_law_1.2,0.03597440123558045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,4,power_law_1.01,0.03776000142097473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,4,power_law_1.2,0.036601600050926206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,4,power_law_1.01,0.03735679984092712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,4,power_law_1.2,0.03699840009212494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,4,power_law_1.01,0.03818239867687225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,4,power_law_1.2,0.038438400626182555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,4,power_law_1.01,0.03837440013885498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,4,power_law_1.2,0.03864319920539856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,4,power_law_1.01,0.04104959964752197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,4,power_law_1.2,0.04007039964199066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,4,power_law_1.01,0.03961600065231323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,128,power_law_1.01,0.06423680186271667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,4,power_law_1.2,0.039654400944709775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,4,power_law_1.01,0.04103679955005646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,128,power_law_1.2,0.0648256003856659
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,4,power_law_1.01,0.041254401206970215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,4,power_law_1.2,0.03966720104217529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,128,power_law_1.01,0.07611520290374756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,128,power_law_1.2,0.08735359907150268
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,4,power_law_1.01,0.04431360065937042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,128,power_law_1.01,0.05766400098800659
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,4,power_law_1.01,0.04984959959983826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,128,power_law_1.2,0.05886719822883606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,128,power_law_1.01,0.06259840130805969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,4,power_law_1.01,0.05085440278053284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,128,power_law_1.2,0.05846400260925293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,128,power_law_1.01,0.06053760051727295
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,4,power_law_1.01,0.054553598165512085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,128,power_law_1.2,0.058259201049804685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,4,power_law_1.01,0.06440320014953613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,128,power_law_1.01,0.05973119735717773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,128,power_law_1.2,0.0621504008769989
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,4,power_law_1.01,0.07893760204315185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,128,power_law_1.01,0.060147202014923094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,4,power_law_1.01,0.09838719964027405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,128,power_law_1.2,0.06234239935874939
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,128,power_law_1.01,0.06115840077400207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,4,power_law_1.01,0.11805440187454223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,128,power_law_1.2,0.06276479959487916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,128,power_law_1.01,0.0599232017993927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,4,power_law_1.01,0.1540992021560669
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,128,power_law_1.2,0.06398720145225525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,4,power_law_1.01,0.1872704029083252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,128,power_law_1.01,0.06155520081520081
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,4,power_law_1.01,0.2364288091659546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,128,power_law_1.2,0.06522240042686463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,128,power_law_1.01,0.06629120111465454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,4,power_law_1.01,0.3355520009994507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,128,power_law_1.2,0.06870399713516236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,128,power_law_1.01,0.06729599833488464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,4,power_law_1.01,0.5137152194976806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,128,power_law_1.2,0.0705407977104187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,128,power_law_1.01,0.0689408004283905
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,4,power_law_1.01,0.6961855888366699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,128,power_law_1.2,0.06767359972000123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,128,power_law_1.01,0.07160320281982421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,4,power_law_1.01,0.7621503829956054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,128,power_law_1.2,0.077920001745224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,4,power_law_1.01,1.2362496376037597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,128,power_law_1.01,0.07980160117149353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,128,power_law_1.2,0.08650239706039428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,4,power_law_1.01,2.4799999237060546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,128,power_law_1.01,0.08471680283546448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,128,power_law_1.2,0.09265919923782348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,128,power_law_1.01,0.09086719751358033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,128,power_law_1.2,0.10535039901733398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,128,power_law_1.01,0.1051967978477478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,128,power_law_1.2,0.12215039730072022
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,128,power_law_1.01,0.11831040382385254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,128,power_law_1.2,0.12686079740524292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,128,power_law_1.01,0.14328960180282593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,128,power_law_1.01,0.1686911940574646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,128,power_law_1.2,0.15531519651412964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,128,power_law_1.01,0.2182528018951416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,128,power_law_1.2,0.18154879808425903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,128,power_law_1.01,0.2727231979370117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,128,power_law_1.2,0.2354048013687134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,64,power_law_1.01,0.0852735996246338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,128,power_law_1.01,0.3681600093841553
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,64,power_law_1.01,0.06684160232543945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,128,power_law_1.2,0.2980736017227173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,64,power_law_1.01,0.07237120270729065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,128,power_law_1.01,0.4490623950958252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,128,power_law_1.2,0.4254591941833496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,64,power_law_1.01,0.0586624026298523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,128,power_law_1.01,0.6638271808624268
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,128,power_law_1.2,0.5554880142211914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,64,power_law_1.01,0.05927039980888367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,128,power_law_1.2,0.7392127990722657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,128,power_law_1.01,0.8329855918884277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,64,power_law_1.01,0.06110720038414001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,128,power_law_1.2,1.0846976280212401
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,128,power_law_1.01,1.02225923538208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,64,power_law_1.01,0.059468799829483034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,128,power_law_1.2,1.3570816040039062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,128,power_law_1.01,1.6956607818603515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,64,power_law_1.01,0.06233599781990051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,128,power_law_1.2,2.314316749572754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,64,power_law_1.01,0.06356480121612548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,128,power_law_1.01,3.373798370361328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,64,power_law_1.01,0.06478719711303711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,128,power_law_1.2,4.501177597045898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,64,power_law_1.01,0.06849279999732971
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,64,power_law_1.01,0.06951040029525757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,64,power_law_1.01,0.07319039702415467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,64,power_law_1.01,0.0738048017024994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,64,power_law_1.01,0.0809664011001587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,64,power_law_1.01,0.0852735996246338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,64,power_law_1.01,0.08977919816970825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,64,power_law_1.2,0.06873599886894226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,64,power_law_1.01,0.10146559476852417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,64,power_law_1.2,0.07100160121917724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,32,power_law_1.01,0.08324480056762695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,64,power_law_1.01,0.11640959978103638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,64,power_law_1.2,0.060550397634506224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,32,power_law_1.01,0.07157120108604431
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,64,power_law_1.01,0.14590079784393312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,64,power_law_1.2,0.05358080267906189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,32,power_law_1.01,0.05578879714012146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,64,power_law_1.01,0.16535040140151977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,64,power_law_1.2,0.056441599130630495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,32,power_law_1.01,0.05560960173606873
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,64,power_law_1.2,0.05850239992141724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,64,power_law_1.01,0.20938239097595215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,32,power_law_1.01,0.058259201049804685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,64,power_law_1.2,0.05932160019874573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,64,power_law_1.01,0.24583680629730226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,32,power_law_1.01,0.061939197778701785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,64,power_law_1.2,0.06157439947128296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,32,power_law_1.01,0.061536002159118655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,64,power_law_1.01,0.3400320053100586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,64,power_law_1.2,0.0630079984664917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,32,power_law_1.01,0.0646016001701355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,64,power_law_1.01,0.44245119094848634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,64,power_law_1.2,0.06587520241737366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,32,power_law_1.01,0.06562560200691223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,64,power_law_1.01,0.6189888000488282
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,64,power_law_1.2,0.07079039812088013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,32,power_law_1.01,0.06846719980239868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,64,power_law_1.01,0.8076031684875489
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,64,power_law_1.2,0.06751999855041504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,32,power_law_1.01,0.07238399982452393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,64,power_law_1.01,1.007084846496582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,64,power_law_1.2,0.07182080149650574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,32,power_law_1.01,0.07299839854240417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,64,power_law_1.01,1.5915776252746583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,64,power_law_1.2,0.07487360239028931
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,32,power_law_1.01,0.07340800166130065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,64,power_law_1.2,0.08266879916191101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,32,power_law_1.01,0.07955840229988098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,64,power_law_1.01,2.9270912170410157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,64,power_law_1.2,0.08511360287666321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,32,power_law_1.01,0.08283519744873047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,64,power_law_1.2,0.09065600037574768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,32,power_law_1.01,0.08979840278625488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,64,power_law_1.2,0.10805120468139648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,32,power_law_1.01,0.09205120205879211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,64,power_law_1.2,0.11870080232620239
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,32,power_law_1.01,0.10904959440231324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,64,power_law_1.2,0.15434880256652833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,32,power_law_1.01,0.12092800140380859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,64,power_law_1.2,0.17401599884033203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,32,power_law_1.01,0.14591360092163086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,64,power_law_1.2,0.23256959915161132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,32,power_law_1.01,0.1692352056503296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,32,power_law_1.2,0.0832256019115448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,64,power_law_1.2,0.2628864049911499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,32,power_law_1.01,0.2143104076385498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,32,power_law_1.2,0.06542080044746398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,32,power_law_1.01,0.25896320343017576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,64,power_law_1.2,0.3824959993362427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,32,power_law_1.2,0.052102398872375486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,32,power_law_1.01,0.3466048002243042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,64,power_law_1.2,0.48919038772583007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,32,power_law_1.2,0.054150402545928955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,32,power_law_1.01,0.4355008125305176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,32,power_law_1.2,0.05660799741744995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,64,power_law_1.2,0.7167168140411377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,32,power_law_1.2,0.06316159963607788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,32,power_law_1.01,0.6128384113311768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,64,power_law_1.2,0.9591872215270996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,32,power_law_1.2,0.06561920046806335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,32,power_law_1.01,0.7723840236663818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,64,power_law_1.2,1.1375871658325196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,32,power_law_1.2,0.06479359865188598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,32,power_law_1.01,0.9939840316772461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,64,power_law_1.2,1.969068717956543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,32,power_law_1.2,0.06766719818115234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,32,power_law_1.01,1.5260607719421386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,32,power_law_1.2,0.0693120002746582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,64,power_law_1.2,4.0041664123535154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,32,power_law_1.2,0.07381759881973267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,32,power_law_1.01,3.0535871505737306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,32,power_law_1.2,0.07422080039978027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,32,power_law_1.2,0.07995520234107971
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,32,power_law_1.2,0.07626879811286927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,32,power_law_1.2,0.08589439988136291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,32,power_law_1.2,0.09265279769897461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,32,power_law_1.2,0.09879040122032165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,32,power_law_1.2,0.1115007996559143
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,16,power_law_1.01,0.07180799841880799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,32,power_law_1.2,0.11968640089035035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,16,power_law_1.01,0.07120000123977661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,16,power_law_1.2,0.06931840181350708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,32,power_law_1.2,0.15327359437942506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,16,power_law_1.01,0.05604479908943176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,16,power_law_1.2,0.07402880191802978
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,32,power_law_1.2,0.17375359535217286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,16,power_law_1.01,0.05399680137634277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,16,power_law_1.2,0.05457280278205871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,16,power_law_1.01,0.05727360248565674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,32,power_law_1.2,0.2311039924621582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,16,power_law_1.2,0.05497599840164184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,16,power_law_1.01,0.06218879818916321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,16,power_law_1.2,0.061945599317550656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,32,power_law_1.2,0.2634495973587036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,16,power_law_1.01,0.06689280271530151
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,16,power_law_1.2,0.06110720038414001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,32,power_law_1.2,0.3795775890350342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,16,power_law_1.01,0.06894720196723939
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,16,power_law_1.2,0.06870399713516236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,32,power_law_1.2,0.48299517631530764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,16,power_law_1.01,0.07038080096244811
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,16,power_law_1.2,0.06869120001792908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,32,power_law_1.2,0.690451192855835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,16,power_law_1.2,0.07095680236816407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,16,power_law_1.01,0.07242879867553711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,32,power_law_1.2,0.8522496223449707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,16,power_law_1.01,0.07653120160102844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,16,power_law_1.2,0.07197440266609192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,32,power_law_1.2,1.1416255950927734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,16,power_law_1.01,0.07980160117149353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,16,power_law_1.2,0.07873280048370361
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,32,power_law_1.2,1.6116479873657226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,16,power_law_1.2,0.08078719973564148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,16,power_law_1.01,0.08021119832992554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,16,power_law_1.2,0.08303999900817871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,16,power_law_1.01,0.08184959888458251
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,32,power_law_1.2,3.8236927032470702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,16,power_law_1.01,0.09393919706344604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,16,power_law_1.2,0.0889792025089264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,16,power_law_1.01,0.0980288028717041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,16,power_law_1.2,0.09799039959907532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,16,power_law_1.01,0.10353920459747315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,16,power_law_1.2,0.10105600357055664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,16,power_law_1.01,0.11789439916610718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,16,power_law_1.2,0.10720000267028809
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,16,power_law_1.01,0.1277184009552002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,16,power_law_1.2,0.12215679883956909
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,16,power_law_1.01,0.149017596244812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,16,power_law_1.2,0.13238400220870972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,16,power_law_1.01,0.17440639734268187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,16,power_law_1.2,0.1565567970275879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,16,power_law_1.01,0.22520320415496825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,16,power_law_1.2,0.1870784044265747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,4,power_law_1.2,0.041715198755264284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,16,power_law_1.01,0.266975998878479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,16,power_law_1.2,0.23598721027374267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,4,power_law_1.2,0.04457600116729736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,8,power_law_1.01,0.06828160285949707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,16,power_law_1.01,0.37020800113677976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,16,power_law_1.2,0.27740159034729006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,4,power_law_1.2,0.04867840111255646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,8,power_law_1.01,0.0686847984790802
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,4,power_law_1.2,0.050732797384262084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,16,power_law_1.01,0.4850815773010254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,16,power_law_1.2,0.4014848232269287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,8,power_law_1.01,0.05374079942703247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,4,power_law_1.2,0.05727360248565674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,16,power_law_1.01,0.6917119979858398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,16,power_law_1.2,0.5165631771087646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,4,power_law_1.2,0.06731520295143127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,8,power_law_1.01,0.05578240156173706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,16,power_law_1.01,0.8512895584106446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,4,power_law_1.2,0.07775359749794006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,16,power_law_1.2,0.7199488162994385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,8,power_law_1.01,0.06356480121612548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,4,power_law_1.2,0.10273920297622681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,16,power_law_1.01,1.0226943969726563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,16,power_law_1.2,0.9435903549194335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,8,power_law_1.01,0.0682752013206482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,4,power_law_1.2,0.11790080070495605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,8,power_law_1.01,0.07299200296401978
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,4,power_law_1.2,0.15947519540786742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,16,power_law_1.01,1.594092845916748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,16,power_law_1.2,1.1318016052246094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,4,power_law_1.2,0.1932736039161682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,8,power_law_1.01,0.076883202791214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,16,power_law_1.2,1.6992895126342773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,4,power_law_1.2,0.2874687910079956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,16,power_law_1.01,3.26033935546875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,8,power_law_1.01,0.07831680178642272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,4,power_law_1.2,0.33907198905944824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,16,power_law_1.2,3.706553649902344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,8,power_law_1.01,0.07953280210494995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,4,power_law_1.2,0.5903615951538086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,8,power_law_1.01,0.08692479729652405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,4,power_law_1.2,0.6272319793701172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,4,power_law_1.2,0.9645503997802735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,8,power_law_1.01,0.09326080083847046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,4,power_law_1.2,1.3861503601074219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,8,power_law_1.01,0.0934719979763031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,4,power_law_1.2,2.5435455322265623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,8,power_law_1.01,0.09096959829330445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,8,power_law_1.01,0.09879680275917054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,8,power_law_1.01,0.10289920568466186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,8,power_law_1.01,0.11251200437545776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,8,power_law_1.01,0.12911360263824462
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,8,power_law_1.2,0.061791998147964475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,8,power_law_1.01,0.14139519929885863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,8,power_law_1.2,0.06874240040779114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,8,power_law_1.01,0.17456640005111695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,8,power_law_1.2,0.05399680137634277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,8,power_law_1.01,0.1987391948699951
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,8,power_law_1.2,0.05767040252685547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,8,power_law_1.01,0.25075199604034426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,8,power_law_1.2,0.06136959791183472
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,4,power_law_1.01,0.06888960003852844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,8,power_law_1.2,0.06661120057106018
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,8,power_law_1.01,0.30687360763549804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,4,power_law_1.01,0.07157120108604431
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,8,power_law_1.2,0.07692800164222717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,8,power_law_1.01,0.41848320960998536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,4,power_law_1.01,0.060710400342941284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,8,power_law_1.2,0.07611520290374756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,8,power_law_1.01,0.5300992012023926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,4,power_law_1.01,0.06664320230484008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,8,power_law_1.2,0.07775999903678894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,4,power_law_1.2,0.06936320066452026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,8,power_law_1.01,0.7609151840209961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,4,power_law_1.01,0.07177600264549255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,8,power_law_1.2,0.08062080144882203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,4,power_law_1.2,0.06791039705276489
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,4,power_law_1.01,0.08140159845352173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,8,power_law_1.01,1.0275584220886231
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,8,power_law_1.2,0.08431360125541687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,4,power_law_1.2,0.05686399936676025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,4,power_law_1.01,0.0953279972076416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,8,power_law_1.01,1.1821632385253906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,8,power_law_1.2,0.08717439770698547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,4,power_law_1.2,0.06177279949188232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,4,power_law_1.01,0.09880319833755494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,8,power_law_1.01,1.8692928314208985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,8,power_law_1.2,0.08840960264205933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,4,power_law_1.2,0.06895999908447266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,4,power_law_1.01,0.09634559750556945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,8,power_law_1.2,0.09045119881629944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,4,power_law_1.2,0.07898240089416504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,4,power_law_1.01,0.10165760517120362
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,8,power_law_1.01,3.6565696716308596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,8,power_law_1.2,0.10273920297622681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,4,power_law_1.2,0.09166079759597778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,4,power_law_1.01,0.10985599756240845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,8,power_law_1.2,0.10458240509033204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,4,power_law_1.2,0.09557759761810303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,4,power_law_1.01,0.11314560174942016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,8,power_law_1.2,0.11011199951171875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,4,power_law_1.2,0.09926400184631348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,4,power_law_1.01,0.1201024055480957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,8,power_law_1.2,0.1293503999710083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,4,power_law_1.2,0.099891197681427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,4,power_law_1.01,0.1274880051612854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,8,power_law_1.2,0.14615679979324342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,4,power_law_1.2,0.1043776035308838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,4,power_law_1.01,0.14202239513397216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,128,power_law_1.01,0.03694719970226288
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,8,power_law_1.2,0.17031680345535277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,4,power_law_1.2,0.11298559904098511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,4,power_law_1.01,0.1555392026901245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,128,power_law_1.01,0.036723199486732486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,8,power_law_1.2,0.20678400993347168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,4,power_law_1.2,0.11420799493789673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,4,power_law_1.01,0.1551103949546814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,128,power_law_1.01,0.0357120007276535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,8,power_law_1.2,0.2641216039657593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,4,power_law_1.2,0.1291584014892578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,4,power_law_1.01,0.1766144037246704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,128,power_law_1.01,0.03531520068645477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,4,power_law_1.2,0.13816959857940675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,8,power_law_1.2,0.3304768085479736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,4,power_law_1.01,0.18030719757080077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,128,power_law_1.01,0.03653759956359863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,4,power_law_1.2,0.14328960180282593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,4,power_law_1.01,0.2184000015258789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,8,power_law_1.2,0.4593023777008057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,128,power_law_1.01,0.03612160086631775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,4,power_law_1.2,0.15312000513076782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,4,power_law_1.01,0.24585599899291993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,8,power_law_1.2,0.5706751823425293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,128,power_law_1.01,0.035724800825119016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,4,power_law_1.2,0.1805567979812622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,128,power_law_1.01,0.03715200126171112
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,4,power_law_1.01,0.3275712013244629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,8,power_law_1.2,0.859654426574707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,128,power_law_1.01,0.03573760092258453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,4,power_law_1.2,0.1801535964012146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,4,power_law_1.01,0.4019008159637451
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,8,power_law_1.2,1.0464511871337892
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,128,power_law_1.01,0.03653759956359863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,4,power_law_1.2,0.22109439373016357
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,4,power_law_1.01,0.5419839859008789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,8,power_law_1.2,1.228927993774414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,128,power_law_1.01,0.03694080114364624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,4,power_law_1.2,0.2678015947341919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,4,power_law_1.01,0.6757184028625488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,8,power_law_1.2,1.940812873840332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,128,power_law_1.01,0.03776639997959137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,4,power_law_1.2,0.34235520362854005
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,4,power_law_1.01,0.9575103759765625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,128,power_law_1.01,0.03939839899539947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,4,power_law_1.2,0.4105535984039307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,8,power_law_1.2,4.180704116821289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,128,power_law_1.01,0.041459199786186215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,4,power_law_1.01,1.223961639404297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,4,power_law_1.2,0.5555583953857421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,128,power_law_1.01,0.04472320079803467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,4,power_law_1.01,1.4854911804199218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,128,power_law_1.01,0.04656639993190766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,4,power_law_1.2,0.6835455894470215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,4,power_law_1.01,2.302444839477539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,128,power_law_1.01,0.0525056004524231
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,4,power_law_1.2,0.9841919898986816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,128,power_law_1.01,0.06069759726524353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,4,power_law_1.01,4.387916946411133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,4,power_law_1.2,1.289145565032959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,128,power_law_1.01,0.058246397972106935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,4,power_law_1.2,1.5539648056030273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,128,power_law_1.2,0.03687680065631867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,128,power_law_1.01,0.06910719871520996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,128,power_law_1.2,0.036582401394844054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,128,power_law_1.01,0.08545920252799988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,4,power_law_1.2,2.4772031784057615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,128,power_law_1.2,0.035769599676132205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,128,power_law_1.01,0.11312639713287354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,128,power_law_1.2,0.03966720104217529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,128,power_law_1.01,0.14097280502319337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,4,power_law_1.2,4.885248184204102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,128,power_law_1.2,0.03617919981479645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,128,power_law_1.01,0.19383039474487304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,64,power_law_1.01,0.038176000118255615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,128,power_law_1.2,0.03473919928073883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,128,power_law_1.01,0.23683199882507325
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,64,power_law_1.01,0.03695360124111176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,128,power_law_1.2,0.035155200958251955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,128,power_law_1.01,0.34189438819885254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,64,power_law_1.01,0.03530240058898926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,128,power_law_1.2,0.03555200099945068
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,128,power_law_1.01,0.4436863899230957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,128,power_law_1.2,0.03597440123558045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,64,power_law_1.01,0.037574398517608645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,128,power_law_1.01,0.5137152194976806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,128,power_law_1.2,0.03637759983539581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,64,power_law_1.01,0.03880319893360138
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,64,power_law_1.2,0.03720319867134094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,128,power_law_1.01,0.915334415435791
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,128,power_law_1.2,0.03781760036945343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,64,power_law_1.01,0.03736959993839264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,64,power_law_1.2,0.035366401076316833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,128,power_law_1.2,0.038841599225997926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,128,power_law_1.01,1.679225540161133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,64,power_law_1.2,0.034944000840187076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,128,power_law_1.2,0.040479999780654904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,64,power_law_1.2,0.0355648010969162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,128,power_law_1.2,0.04293760061264038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,64,power_law_1.2,0.03637759983539581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,128,power_law_1.2,0.04785920083522797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,64,power_law_1.2,0.03596799969673157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,128,power_law_1.2,0.04948480129241943
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,64,power_law_1.2,0.036185601353645326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,128,power_law_1.2,0.05788800120353699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,64,power_law_1.2,0.03743360042572021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,128,power_law_1.2,0.07243520021438599
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,64,power_law_1.2,0.037011200189590455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,32,power_law_1.01,0.0400191992521286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,128,power_law_1.2,0.06670079827308655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,64,power_law_1.2,0.03783040046691895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,32,power_law_1.01,0.03654400110244751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,128,power_law_1.2,0.07775359749794006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,64,power_law_1.2,0.03966720104217529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,32,power_law_1.01,0.03489919900894165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,128,power_law_1.2,0.09537280201911927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,64,power_law_1.2,0.04131200015544891
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,32,power_law_1.01,0.03429119884967804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,128,power_law_1.2,0.14368640184402465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,64,power_law_1.2,0.04252800047397613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,32,power_law_1.01,0.03530240058898926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,128,power_law_1.2,0.17319040298461913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,64,power_law_1.2,0.041920000314712526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,32,power_law_1.01,0.03735679984092712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,128,power_law_1.2,0.2592128038406372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,64,power_law_1.2,0.046623998880386354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,32,power_law_1.01,0.037145599722862244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,128,power_law_1.2,0.3153088092803955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,64,power_law_1.2,0.04785279929637909
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,32,power_law_1.01,0.03776000142097473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,128,power_law_1.2,0.48879361152648926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,64,power_law_1.2,0.05072000026702881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,32,power_law_1.01,0.03858560025691986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,128,power_law_1.2,0.5571775913238526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,64,power_law_1.2,0.05809919834136963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,32,power_law_1.01,0.03899520039558411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,128,power_law_1.2,0.724505615234375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,64,power_law_1.2,0.06195840239524841
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,32,power_law_1.01,0.03980799913406372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,64,power_law_1.2,0.07918720245361328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,128,power_law_1.2,1.1830464363098145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,32,power_law_1.01,0.04103679955005646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,64,power_law_1.2,0.09945600032806397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,32,power_law_1.01,0.04268159866333008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,128,power_law_1.2,2.3131328582763673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,64,power_law_1.2,0.13591040372848512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,32,power_law_1.01,0.04104959964752197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,64,power_law_1.2,0.1643839955329895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,32,power_law_1.01,0.04657280147075653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,64,power_law_1.2,0.24280960559844972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,32,power_law_1.01,0.04759680032730103
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,64,power_law_1.2,0.28831360340118406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,32,power_law_1.01,0.05128960013389587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,64,power_law_1.2,0.5010752201080322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,32,power_law_1.01,0.05578879714012146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,32,power_law_1.01,0.06028159856796265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,64,power_law_1.2,0.6429823875427246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,32,power_law_1.2,0.03924480080604553
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,32,power_law_1.01,0.07340160012245178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,64,power_law_1.2,0.7527872085571289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,32,power_law_1.2,0.032287999987602234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,32,power_law_1.01,0.08506240248680115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,64,power_law_1.2,1.228108787536621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,32,power_law_1.2,0.03473919928073883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,32,power_law_1.01,0.11763839721679688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,32,power_law_1.2,0.03454079926013946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,64,power_law_1.2,2.573036766052246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,32,power_law_1.01,0.13480960130691527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,32,power_law_1.2,0.0355648010969162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,32,power_law_1.01,0.18153599500656128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,32,power_law_1.2,0.03761279881000519
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,32,power_law_1.01,0.21860480308532715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,32,power_law_1.2,0.03716480135917664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,32,power_law_1.2,0.0367935985326767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,32,power_law_1.01,0.3166975975036621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,32,power_law_1.2,0.03781760036945343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,32,power_law_1.01,0.4309696197509766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,32,power_law_1.2,0.03925119936466217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,32,power_law_1.01,0.5063168048858643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,32,power_law_1.2,0.04007039964199066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,32,power_law_1.01,0.8186688423156738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,16,power_law_1.01,0.042534399032592776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,32,power_law_1.2,0.041503998637199405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,16,power_law_1.01,0.034355199337005614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,32,power_law_1.2,0.043756800889968875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,32,power_law_1.01,1.4883584022521972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,16,power_law_1.01,0.03372800052165985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,32,power_law_1.2,0.04498560130596161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,16,power_law_1.01,0.034329599142074584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,32,power_law_1.2,0.04826880097389221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,16,power_law_1.01,0.03681919872760773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,32,power_law_1.2,0.05051519870758057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,16,power_law_1.01,0.039263999462127684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,32,power_law_1.2,0.05011199712753296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,16,power_law_1.01,0.03885439932346344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,32,power_law_1.2,0.05808640122413635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,16,power_law_1.01,0.039059200882911684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,32,power_law_1.2,0.06280320286750793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,16,power_law_1.01,0.040268799662590025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,32,power_law_1.2,0.07488639950752259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,16,power_law_1.2,0.04349440038204193
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,16,power_law_1.01,0.040889599919319154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,32,power_law_1.2,0.09166719913482665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,16,power_law_1.2,0.0344895988702774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,16,power_law_1.01,0.04293760061264038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,32,power_law_1.2,0.12034560441970825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,16,power_law_1.2,0.034892800450325015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,16,power_law_1.01,0.04336000084877014
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,32,power_law_1.2,0.14676480293273925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,16,power_law_1.2,0.03529599905014038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,16,power_law_1.01,0.046419200301170346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,32,power_law_1.2,0.2157952070236206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,16,power_law_1.2,0.03653120100498199
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,16,power_law_1.01,0.04578559994697571
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,32,power_law_1.2,0.25265278816223147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,16,power_law_1.2,0.03857919871807099
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,16,power_law_1.01,0.049497601389884946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,32,power_law_1.2,0.3722496032714844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,16,power_law_1.2,0.03899520039558411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,16,power_law_1.01,0.05236480236053467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,32,power_law_1.2,0.5068031787872315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,16,power_law_1.2,0.04022400081157684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,16,power_law_1.01,0.05257599949836731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,32,power_law_1.2,0.6540671825408936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,16,power_law_1.2,0.041247999668121337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,16,power_law_1.01,0.05687040090560913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,32,power_law_1.2,1.1097408294677735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,16,power_law_1.2,0.04166400134563446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,16,power_law_1.01,0.06259840130805969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,16,power_law_1.2,0.04350079894065857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,16,power_law_1.01,0.07408000230789184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,32,power_law_1.2,2.3289152145385743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,16,power_law_1.2,0.04371199905872345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,16,power_law_1.01,0.0920960009098053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,16,power_law_1.2,0.04552960097789764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,16,power_law_1.01,0.12240639925003052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,16,power_law_1.2,0.04471679925918579
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,16,power_law_1.01,0.1438976049423218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,16,power_law_1.2,0.0500544011592865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,16,power_law_1.01,0.20145280361175538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,16,power_law_1.2,0.05169919729232788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,16,power_law_1.01,0.25061759948730467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,16,power_law_1.2,0.05333120226860046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,16,power_law_1.01,0.33498239517211914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,16,power_law_1.2,0.05987200140953064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,16,power_law_1.01,0.4724031925201416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,16,power_law_1.2,0.06888960003852844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,8,power_law_1.01,0.04394879937171936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,16,power_law_1.01,0.5399936199188232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,16,power_law_1.2,0.08385279774665833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,8,power_law_1.01,0.035359999537467955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,16,power_law_1.01,0.8875264167785645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,16,power_law_1.2,0.09326080083847046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,8,power_law_1.01,0.035366401076316833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,16,power_law_1.2,0.13114880323410033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,16,power_law_1.01,1.8378047943115234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,8,power_law_1.01,0.037196800112724304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,16,power_law_1.2,0.1508095979690552
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,8,power_law_1.01,0.03699840009212494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,16,power_law_1.2,0.21797120571136475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,8,power_law_1.01,0.04211199879646301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,16,power_law_1.2,0.2810688018798828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,8,power_law_1.01,0.04252800047397613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,8,power_law_1.01,0.045184001326560974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,16,power_law_1.2,0.43507838249206543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,8,power_law_1.01,0.04539520144462585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,16,power_law_1.2,0.5210815906524658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,8,power_law_1.01,0.046828800439834596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,16,power_law_1.2,0.7473919868469239
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,8,power_law_1.01,0.0470335990190506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,16,power_law_1.2,1.0846912384033203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,8,power_law_1.01,0.046623998880386354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,8,power_law_1.2,0.04519680142402649
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,8,power_law_1.01,0.04867199957370758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,8,power_law_1.2,0.03433600068092346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,16,power_law_1.2,2.5758527755737304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,8,power_law_1.01,0.05112959742546082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,8,power_law_1.2,0.033932799100875856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,8,power_law_1.01,0.05480960011482239
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,8,power_law_1.2,0.03699840009212494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,8,power_law_1.01,0.056857597827911374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,8,power_law_1.2,0.03844479918479919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,8,power_law_1.01,0.05685120224952698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,8,power_law_1.2,0.04252800047397613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,8,power_law_1.01,0.0646336019039154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,8,power_law_1.2,0.04232960045337677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,8,power_law_1.01,0.07200639843940734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,8,power_law_1.2,0.04416640102863312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,8,power_law_1.01,0.08799359798431397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,8,power_law_1.2,0.04417920112609863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,8,power_law_1.01,0.10314240455627441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,8,power_law_1.2,0.0456063985824585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,8,power_law_1.01,0.1410367965698242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,8,power_law_1.2,0.045817598700523376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,8,power_law_1.01,0.1678655982017517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,8,power_law_1.2,0.046988800168037415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,4,power_law_1.01,0.043910399079322815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,8,power_law_1.01,0.22111361026763915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,8,power_law_1.2,0.04847359955310822
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,4,power_law_1.01,0.03531520068645477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,8,power_law_1.2,0.050521600246429446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,8,power_law_1.01,0.27640318870544434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,4,power_law_1.01,0.0385919988155365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,8,power_law_1.2,0.05932160019874573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,8,power_law_1.01,0.40337281227111815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,4,power_law_1.01,0.03980799913406372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,8,power_law_1.2,0.06136959791183472
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,4,power_law_1.01,0.04350079894065857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,8,power_law_1.01,0.529747200012207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,4,power_law_1.01,0.04922879934310913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,8,power_law_1.2,0.06032639741897583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,8,power_law_1.01,0.5977536201477051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,4,power_law_1.01,0.05086719989776611
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,8,power_law_1.2,0.06710399985313416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,8,power_law_1.01,1.001408004760742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,4,power_law_1.01,0.05087360143661499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,8,power_law_1.2,0.07408000230789184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,4,power_law_1.01,0.05046399831771851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,8,power_law_1.01,1.9350847244262694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,8,power_law_1.2,0.09721599817276001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,4,power_law_1.01,0.05457280278205871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,8,power_law_1.2,0.11308159828186035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,4,power_law_1.01,0.051283198595047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,8,power_law_1.2,0.14902399778366088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,4,power_law_1.01,0.05230720043182373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,8,power_law_1.2,0.179750394821167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,4,power_law_1.01,0.05456640124320984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,8,power_law_1.2,0.26331520080566406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,4,power_law_1.01,0.057011198997497556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,8,power_law_1.2,0.3313024044036865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,4,power_law_1.01,0.06213759779930115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,8,power_law_1.2,0.4744448184967041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,4,power_law_1.01,0.06378239989280701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,8,power_law_1.2,0.655289602279663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,4,power_law_1.01,0.06685439944267273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,8,power_law_1.2,0.8256832122802734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,4,power_law_1.01,0.07626240253448487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,8,power_law_1.2,1.2551551818847657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,4,power_law_1.2,0.04008319973945618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,4,power_law_1.01,0.0906112015247345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,4,power_law_1.2,0.034745600819587705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,4,power_law_1.01,0.11149439811706544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,8,power_law_1.2,2.237779235839844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,4,power_law_1.2,0.03699840009212494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,4,power_law_1.01,0.13032959699630736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,4,power_law_1.2,0.038848000764846805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,64,power_law_1.01,0.036959999799728395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,4,power_law_1.01,0.16842880249023437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,4,power_law_1.2,0.0412992000579834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,64,power_law_1.01,0.03777920007705689
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,4,power_law_1.01,0.22330880165100098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,4,power_law_1.2,0.04865919947624207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,64,power_law_1.01,0.03776639997959137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,4,power_law_1.01,0.2810688018798828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,4,power_law_1.2,0.048467200994491574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,64,power_law_1.01,0.03818239867687225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,4,power_law_1.01,0.36012160778045654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,4,power_law_1.2,0.05195519924163818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,64,power_law_1.01,0.03920640051364899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,4,power_law_1.01,0.5301055908203125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,4,power_law_1.2,0.05441280007362366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,64,power_law_1.01,0.04105600118637085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,4,power_law_1.01,0.6503232002258301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,32,power_law_1.01,0.0716159999370575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,4,power_law_1.2,0.05622400045394897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,64,power_law_1.01,0.04105600118637085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,4,power_law_1.01,0.8231679916381835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,32,power_law_1.01,0.06382719874382019
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,4,power_law_1.2,0.05132160186767578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,64,power_law_1.01,0.0430976003408432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,32,power_law_1.01,0.049881601333618165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,64,power_law_1.01,0.046374401450157164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,4,power_law_1.2,0.05317760109901428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,4,power_law_1.01,1.270252799987793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,32,power_law_1.01,0.05093119740486145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,64,power_law_1.01,0.047603198885917665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,4,power_law_1.2,0.053376001119613645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,4,power_law_1.01,2.4160703659057616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,32,power_law_1.01,0.05256320238113403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,4,power_law_1.2,0.056652802228927615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,64,power_law_1.01,0.05557119846343994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,32,power_law_1.01,0.05564799904823303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,64,power_law_1.01,0.06645119786262513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,64,power_law_1.01,0.06071680188179016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,32,power_law_1.01,0.057068800926208495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,64,power_law_1.01,0.07176960110664368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,32,power_law_1.01,0.05767679810523987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,64,power_law_1.01,0.08323839902877808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,32,power_law_1.01,0.05932160019874573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,64,power_law_1.01,0.10966399908065796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,32,power_law_1.01,0.059935998916625974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,32,power_law_1.01,0.06322559714317322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,64,power_law_1.01,0.13607679605484008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,32,power_law_1.01,0.06566399931907654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,64,power_law_1.01,0.19301120042800904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,32,power_law_1.2,0.06561920046806335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,32,power_law_1.01,0.06607999801635742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,64,power_law_1.01,0.24728960990905763
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,32,power_law_1.2,0.057017600536346434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,32,power_law_1.01,0.06812800168991089
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,64,power_law_1.01,0.3066688060760498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,32,power_law_1.2,0.051283198595047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,32,power_law_1.01,0.0720192015171051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,32,power_law_1.2,0.051692801713943484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,64,power_law_1.01,0.4526847839355469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,32,power_law_1.01,0.07386239767074584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,32,power_law_1.2,0.05354239940643311
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,64,power_law_1.01,0.5645055770874023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,32,power_law_1.01,0.08369920253753663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,32,power_law_1.2,0.05722879767417908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,64,power_law_1.01,0.8657855987548828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,32,power_law_1.01,0.09352959990501404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,32,power_law_1.2,0.05906559824943543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,32,power_law_1.01,0.10704640150070191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,64,power_law_1.01,1.6855808258056642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,32,power_law_1.2,0.05947520136833191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,32,power_law_1.01,0.1295680046081543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,32,power_law_1.2,0.06105599999427795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,32,power_law_1.01,0.14636160135269166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,32,power_law_1.2,0.06235520243644714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,32,power_law_1.01,0.18999040126800537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,32,power_law_1.2,0.06520959734916687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,32,power_law_1.01,0.22213759422302246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,32,power_law_1.2,0.06581760048866273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,32,power_law_1.2,0.06480000019073487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,32,power_law_1.01,0.3161535978317261
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,32,power_law_1.2,0.07237120270729065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,32,power_law_1.01,0.41036162376403806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,32,power_law_1.2,0.0748416006565094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,32,power_law_1.01,0.5518720149993896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,16,power_law_1.01,0.07668480277061462
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,32,power_law_1.2,0.0820032000541687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,32,power_law_1.01,0.7216512203216553
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,16,power_law_1.01,0.05539199709892273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,32,power_law_1.2,0.08794879913330078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,32,power_law_1.01,0.8682815551757812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,16,power_law_1.01,0.053497600555419925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,32,power_law_1.2,0.09921280145645142
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,32,power_law_1.01,1.4144895553588868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,16,power_law_1.01,0.055379199981689456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,32,power_law_1.2,0.1131327986717224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,16,power_law_1.01,0.05539199709892273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,32,power_law_1.2,0.13791999816894532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,32,power_law_1.01,2.767398452758789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,16,power_law_1.01,0.06112639904022217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,32,power_law_1.2,0.16843520402908324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,16,power_law_1.01,0.06090239882469177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,32,power_law_1.2,0.20366079807281495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,16,power_law_1.01,0.06275200247764587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,32,power_law_1.2,0.2593535900115967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,16,power_law_1.01,0.06399359703063964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,32,power_law_1.2,0.3756799936294556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,16,power_law_1.01,0.06522240042686463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,32,power_law_1.2,0.4654079914093018
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,16,power_law_1.01,0.06808320283889771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,32,power_law_1.2,0.6005568027496337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,16,power_law_1.01,0.07259520292282104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,32,power_law_1.2,0.824403190612793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,16,power_law_1.01,0.07423359751701356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,16,power_law_1.2,0.07448959946632386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,16,power_law_1.01,0.07381119728088378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,32,power_law_1.2,1.0054335594177246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,16,power_law_1.2,0.05052800178527832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,16,power_law_1.01,0.08039039969444275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,32,power_law_1.2,1.7038080215454101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,16,power_law_1.2,0.05072640180587769
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,16,power_law_1.01,0.08283519744873047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,16,power_law_1.2,0.050316798686981204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,16,power_law_1.01,0.08610560297966004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,32,power_law_1.2,3.7692161560058595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,16,power_law_1.2,0.05400320291519165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,16,power_law_1.01,0.10536960363388062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,16,power_law_1.2,0.05932160019874573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,16,power_law_1.01,0.11601279973983765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,16,power_law_1.2,0.05870720148086548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,16,power_law_1.01,0.14261759519577027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,16,power_law_1.2,0.06116480231285095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,16,power_law_1.01,0.1606592059135437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,16,power_law_1.2,0.06281599998474122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,16,power_law_1.01,0.2077631950378418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,16,power_law_1.2,0.06465920209884643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,16,power_law_1.01,0.2499392032623291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,16,power_law_1.2,0.06711040139198303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,16,power_law_1.01,0.33350400924682616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,16,power_law_1.2,0.0685375988483429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,16,power_law_1.01,0.4223936080932617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,16,power_law_1.2,0.07100160121917724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,16,power_law_1.01,0.596895980834961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,8,power_law_1.01,0.06848000288009644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,16,power_law_1.2,0.07242879867553711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,16,power_law_1.01,0.7527167797088623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,8,power_law_1.01,0.061536002159118655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,16,power_law_1.2,0.07631360292434693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,16,power_law_1.01,0.9010047912597656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,8,power_law_1.01,0.05394560098648071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,16,power_law_1.2,0.08062719702720642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,16,power_law_1.01,1.450476837158203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,8,power_law_1.01,0.05354239940643311
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,16,power_law_1.2,0.08799359798431397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,8,power_law_1.01,0.0590719997882843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,16,power_law_1.2,0.10439039468765259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,16,power_law_1.01,2.953299140930176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,8,power_law_1.01,0.06520320177078247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,16,power_law_1.2,0.11912319660186768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,8,power_law_1.01,0.06746240258216858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,16,power_law_1.2,0.14494080543518068
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,8,power_law_1.01,0.07096319794654846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,16,power_law_1.2,0.16890239715576172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,8,power_law_1.01,0.06889600157737732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,16,power_law_1.2,0.21907200813293456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,8,power_law_1.01,0.07340160012245178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,16,power_law_1.2,0.2567487955093384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,8,power_law_1.01,0.07870079874992371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,16,power_law_1.2,0.34482560157775877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,8,power_law_1.01,0.07871999740600585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,16,power_law_1.2,0.456006383895874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,8,power_law_1.01,0.08302720189094544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,16,power_law_1.2,0.645465612411499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,8,power_law_1.01,0.07910400032997131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,16,power_law_1.2,0.9248064041137696
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,8,power_law_1.2,0.06605439782142639
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,8,power_law_1.01,0.0887615978717804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,8,power_law_1.2,0.05416319966316223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,16,power_law_1.2,1.0683775901794434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,8,power_law_1.01,0.08938239812850952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,8,power_law_1.2,0.05271040201187134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,16,power_law_1.2,1.7063295364379882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,8,power_law_1.01,0.09470720291137695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,8,power_law_1.2,0.0578495979309082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,8,power_law_1.01,0.11395200490951538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,8,power_law_1.2,0.05866879820823669
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,16,power_law_1.2,3.766815948486328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,8,power_law_1.01,0.1289023995399475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,8,power_law_1.2,0.06604160070419311
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,8,power_law_1.01,0.1493824005126953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,8,power_law_1.2,0.06645119786262513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,8,power_law_1.01,0.1788800001144409
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,8,power_law_1.2,0.06993280053138733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,8,power_law_1.2,0.07176960110664368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,8,power_law_1.01,0.2331455945968628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,8,power_law_1.2,0.07219200134277344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,8,power_law_1.01,0.28393599987030027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,8,power_law_1.2,0.07545599937438965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,8,power_law_1.01,0.37262721061706544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,8,power_law_1.2,0.0789247989654541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,8,power_law_1.01,0.481766414642334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,8,power_law_1.2,0.08199040293693542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,8,power_law_1.01,0.651148796081543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,8,power_law_1.2,0.08017280101776122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,8,power_law_1.01,0.8512255668640136
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,8,power_law_1.2,0.08734080195426941
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,8,power_law_1.01,1.1166463851928712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,8,power_law_1.2,0.09184640049934387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,8,power_law_1.2,0.1027008056640625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,8,power_law_1.01,1.5932160377502442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,4,power_law_1.01,0.06096000075340271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,8,power_law_1.2,0.11887359619140625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,4,power_law_1.01,0.06158080101013184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,8,power_law_1.2,0.13178240060806273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,8,power_law_1.01,3.1979583740234374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,8,power_law_1.2,0.16019840240478517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,4,power_law_1.01,0.05397760272026062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,4,power_law_1.01,0.0593280017375946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,8,power_law_1.2,0.18113919496536254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,4,power_law_1.01,0.06504960060119629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,8,power_law_1.2,0.23274879455566405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,4,power_law_1.01,0.0748799979686737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,8,power_law_1.2,0.30176639556884766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,4,power_law_1.01,0.07653759717941284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,8,power_law_1.2,0.3998656034469604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,4,power_law_1.01,0.08164479732513427
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,8,power_law_1.2,0.48833279609680175
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,4,power_law_1.01,0.08165760040283203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,8,power_law_1.2,0.7760640144348144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,4,power_law_1.01,0.08574720025062561
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,8,power_law_1.2,1.0613696098327636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,4,power_law_1.01,0.09149439930915833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,8,power_law_1.2,1.205958366394043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,4,power_law_1.01,0.09476479887962341
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,4,power_law_1.01,0.09290879964828491
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,8,power_law_1.2,1.9886911392211915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,4,power_law_1.01,0.10029439926147461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,4,power_law_1.2,0.061926400661468504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,4,power_law_1.01,0.1074560046195984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,8,power_law_1.2,4.142975997924805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,4,power_law_1.2,0.0555840015411377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,4,power_law_1.01,0.11871360540390015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,4,power_law_1.2,0.05620480179786682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,4,power_law_1.01,0.11646080017089844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,4,power_law_1.2,0.05845119953155518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,4,power_law_1.01,0.1314239978790283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,4,power_law_1.2,0.06316159963607788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,4,power_law_1.01,0.15230079889297485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,4,power_law_1.01,0.18956799507141114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,4,power_law_1.2,0.07663999795913697
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,4,power_law_1.01,0.21864960193634034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,4,power_law_1.2,0.07953919768333435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,4,power_law_1.01,0.2825536012649536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,4,power_law_1.2,0.08241279721260071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,128,power_law_1.01,0.07442560195922851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,4,power_law_1.01,0.35669760704040526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,4,power_law_1.2,0.08425599932670594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,128,power_law_1.01,0.07628160119056701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,4,power_law_1.2,0.08773760199546814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,4,power_law_1.01,0.4597055912017822
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,4,power_law_1.2,0.09326720237731934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,4,power_law_1.01,0.5522687911987305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,128,power_law_1.01,0.07217919826507568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,4,power_law_1.2,0.09511680006980897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,128,power_law_1.01,0.06442880034446716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,4,power_law_1.01,0.8101247787475586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,4,power_law_1.2,0.10105600357055664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,128,power_law_1.01,0.06972799897193908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,4,power_law_1.01,1.0626432418823242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,4,power_law_1.2,0.10268800258636475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,128,power_law_1.01,0.0770687997341156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,4,power_law_1.01,1.3063551902770996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,4,power_law_1.2,0.11088000535964966
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,4,power_law_1.2,0.06218240261077881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,128,power_law_1.01,0.07751039862632751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,4,power_law_1.01,2.0092287063598633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,4,power_law_1.2,0.06525440216064453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,4,power_law_1.2,0.11763839721679688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,128,power_law_1.01,0.07852799892425537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,4,power_law_1.2,0.07180160284042358
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,4,power_law_1.2,0.12091519832611083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,4,power_law_1.01,4.071340942382813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,4,power_law_1.2,0.08163840174674988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,128,power_law_1.01,0.07955840229988098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,4,power_law_1.2,0.14056960344314576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,4,power_law_1.2,0.09697920083999634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,4,power_law_1.2,0.15489920377731323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,128,power_law_1.01,0.07626240253448487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,4,power_law_1.2,0.11646720170974731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,4,power_law_1.2,0.18358399868011474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,128,power_law_1.01,0.07950720191001892
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,4,power_law_1.2,0.136735999584198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,4,power_law_1.2,0.22289280891418456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,128,power_law_1.01,0.08323839902877808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,4,power_law_1.2,0.178713595867157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,4,power_law_1.2,0.28270080089569094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,128,power_law_1.01,0.08609920144081115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,4,power_law_1.2,0.21230080127716064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,4,power_law_1.2,0.37363200187683104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,4,power_law_1.2,0.30302720069885253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,128,power_law_1.01,0.08651520013809204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,4,power_law_1.2,0.4977407932281494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,128,power_law_1.2,0.11052800416946411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,4,power_law_1.2,0.4265279769897461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,128,power_law_1.01,0.0955136001110077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,4,power_law_1.2,0.6226496219635009
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,128,power_law_1.2,0.09722239971160888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,4,power_law_1.2,0.5440896034240723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,128,power_law_1.01,0.09798399806022644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,4,power_law_1.2,0.8686335563659668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,128,power_law_1.2,0.06813439726829529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,4,power_law_1.2,0.704857587814331
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,128,power_law_1.01,0.10536320209503174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,4,power_law_1.2,1.1514431953430175
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,128,power_law_1.2,0.06054400205612183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,4,power_law_1.2,0.8985856056213379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,128,power_law_1.01,0.12380160093307495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,4,power_law_1.2,1.4439167976379395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,128,power_law_1.2,0.06465280055999756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,4,power_law_1.2,1.3776127815246582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,128,power_law_1.01,0.1297279953956604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,4,power_law_1.2,2.2889215469360353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,128,power_law_1.2,0.06465280055999756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,4,power_law_1.2,3.136422348022461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,128,power_law_1.01,0.15634560585021973
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,128,power_law_1.2,0.07222399711608887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,4,power_law_1.2,4.3481792449951175
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,128,power_law_1.01,0.18176640272140504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,128,power_law_1.2,0.07365760207176208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,128,power_law_1.01,0.24173440933227539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,128,power_law_1.2,0.07508479952812194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,128,power_law_1.01,0.28312320709228517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,128,power_law_1.2,0.07448319792747497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,128,power_law_1.01,0.37937920093536376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,128,power_law_1.2,0.08163840174674988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,128,power_law_1.01,0.4911935806274414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,128,power_law_1.2,0.08103039860725403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,128,power_law_1.2,0.08186240196228027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,128,power_law_1.01,0.677350378036499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,64,power_law_1.01,0.11134079694747925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,64,power_law_1.2,0.11189759969711303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,128,power_law_1.2,0.08635519742965699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,64,power_law_1.01,0.09125760197639465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,128,power_law_1.01,0.9083711624145507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,64,power_law_1.2,0.08609279990196228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,128,power_law_1.2,0.09312000274658203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,64,power_law_1.01,0.08184959888458251
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,128,power_law_1.01,1.0572544097900392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,64,power_law_1.2,0.07541760206222534
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,64,power_law_1.01,0.06238719820976257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,128,power_law_1.01,1.6628543853759765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,64,power_law_1.2,0.060710400342941284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,64,power_law_1.01,0.061363202333450315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,128,power_law_1.01,3.3319358825683594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,64,power_law_1.2,0.06847360134124755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,64,power_law_1.01,0.06751360297203064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,64,power_law_1.2,0.06151679754257202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,64,power_law_1.01,0.06629120111465454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,64,power_law_1.2,0.06561920046806335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,64,power_law_1.01,0.07223680019378662
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,64,power_law_1.01,0.07612159848213196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,64,power_law_1.2,0.07010560035705567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,64,power_law_1.01,0.07446399927139283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,64,power_law_1.2,0.07504000067710877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,64,power_law_1.01,0.07898240089416504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,64,power_law_1.2,0.07238399982452393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,64,power_law_1.01,0.07980160117149353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,64,power_law_1.2,0.07114880084991455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,32,power_law_1.01,0.07216640114784241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,64,power_law_1.01,0.0822655975818634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,64,power_law_1.2,0.07872639894485474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,32,power_law_1.01,0.09348480105400085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,64,power_law_1.01,0.08266239762306213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,64,power_law_1.2,0.08158079981803894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,32,power_law_1.01,0.0889792025089264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,64,power_law_1.01,0.09290879964828491
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,64,power_law_1.2,0.08323839902877808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,32,power_law_1.01,0.05928320288658142
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,64,power_law_1.01,0.09659519791603088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,64,power_law_1.2,0.09142400026321411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,32,power_law_1.01,0.061312001943588254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,64,power_law_1.01,0.10228480100631714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,64,power_law_1.2,0.09388160109519958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,32,power_law_1.01,0.06521599888801574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,64,power_law_1.01,0.1193343997001648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,64,power_law_1.2,0.10453120470046998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,32,power_law_1.01,0.07054719924926758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,64,power_law_1.01,0.1256832003593445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,64,power_law_1.2,0.11906559467315674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,32,power_law_1.01,0.0742143988609314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,64,power_law_1.01,0.15679999589920043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,64,power_law_1.2,0.13320959806442262
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,32,power_law_1.01,0.07648000121116638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,64,power_law_1.01,0.1780992031097412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,64,power_law_1.2,0.16290559768676757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,32,power_law_1.01,0.0791487991809845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,64,power_law_1.01,0.23176319599151612
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,32,power_law_1.01,0.07722880244255066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,64,power_law_1.2,0.18480639457702636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,64,power_law_1.01,0.27927680015563966
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,32,power_law_1.01,0.0803712010383606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,64,power_law_1.2,0.24051198959350586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,64,power_law_1.01,0.3693887948989868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,32,power_law_1.01,0.08364800214767457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,64,power_law_1.2,0.28720641136169434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,64,power_law_1.01,0.4879615783691406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,32,power_law_1.01,0.0906175971031189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,64,power_law_1.01,0.6867968082427979
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,64,power_law_1.2,0.39801599979400637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,32,power_law_1.01,0.09655680060386658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,64,power_law_1.2,0.5178112030029297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,64,power_law_1.01,0.8797504425048828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,32,power_law_1.01,0.1004480004310608
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,64,power_law_1.2,0.7695104122161865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,64,power_law_1.01,1.0552639961242676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,32,power_law_1.01,0.10863360166549682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,64,power_law_1.2,0.9243328094482421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,64,power_law_1.01,1.6227584838867188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,32,power_law_1.01,0.12543359994888306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,64,power_law_1.2,1.1707072257995605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,32,power_law_1.01,0.12951680421829223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,64,power_law_1.01,3.3449214935302733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,32,power_law_1.01,0.1561344027519226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,64,power_law_1.2,1.9079872131347657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,32,power_law_1.01,0.1852288007736206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,64,power_law_1.2,3.7139328002929686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,32,power_law_1.01,0.23255679607391358
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,32,power_law_1.01,0.2857984066009521
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,32,power_law_1.01,0.37650558948516843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,32,power_law_1.01,0.48538880348205565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,32,power_law_1.2,0.07195519804954528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,32,power_law_1.01,0.7035647869110108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,32,power_law_1.2,0.09043840169906617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,32,power_law_1.01,0.8707008361816406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,32,power_law_1.2,0.07263360023498536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,32,power_law_1.01,1.0683263778686523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,32,power_law_1.2,0.05850239992141724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,16,power_law_1.01,0.07319679856300354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,32,power_law_1.01,1.6329536437988281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,32,power_law_1.2,0.05849599838256836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,16,power_law_1.01,0.0729856014251709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,32,power_law_1.2,0.06504319906234741
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,32,power_law_1.01,3.2160640716552735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,16,power_law_1.01,0.09019520282745361
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,32,power_law_1.2,0.06710399985313416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,16,power_law_1.01,0.05987840294837952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,32,power_law_1.2,0.07222399711608887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,16,power_law_1.01,0.05947520136833191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,32,power_law_1.2,0.07324159741401673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,16,power_law_1.01,0.06624000072479248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,32,power_law_1.2,0.07733759880065919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,16,power_law_1.01,0.06970880031585694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,32,power_law_1.2,0.07815679907798767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,16,power_law_1.01,0.07872639894485474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,32,power_law_1.2,0.08328319787979126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,16,power_law_1.01,0.07790079712867737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,32,power_law_1.2,0.08389760255813598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,16,power_law_1.01,0.0803712010383606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,16,power_law_1.2,0.07301120162010193
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,32,power_law_1.2,0.08820480108261108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,16,power_law_1.01,0.0862335979938507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,16,power_law_1.2,0.07566720247268677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,32,power_law_1.2,0.09658880233764648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,16,power_law_1.01,0.08795520067214965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,16,power_law_1.2,0.06849920153617858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,32,power_law_1.2,0.0980288028717041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,16,power_law_1.01,0.08775039911270141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,16,power_law_1.2,0.0603007972240448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,32,power_law_1.2,0.10416640043258667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,16,power_law_1.01,0.09592959880828858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,16,power_law_1.2,0.06480640172958374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,32,power_law_1.2,0.12240639925003052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,16,power_law_1.01,0.10576000213623046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,16,power_law_1.2,0.06808320283889771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,32,power_law_1.2,0.1391808032989502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,16,power_law_1.01,0.10823680162429809
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,16,power_law_1.2,0.0713599979877472
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,32,power_law_1.2,0.1670464038848877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,16,power_law_1.01,0.10984959602355956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,16,power_law_1.2,0.07874559760093688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,32,power_law_1.2,0.18629759550094604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,16,power_law_1.01,0.12705279588699342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,16,power_law_1.2,0.08037760257720947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,32,power_law_1.2,0.242195200920105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,16,power_law_1.01,0.1372928023338318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,16,power_law_1.2,0.08303999900817871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,32,power_law_1.2,0.289305591583252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,16,power_law_1.01,0.16309759616851807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,16,power_law_1.2,0.08485760092735291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,32,power_law_1.2,0.399616003036499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,16,power_law_1.01,0.19218560457229614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,16,power_law_1.2,0.08814079761505127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,32,power_law_1.2,0.5023039817810059
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,16,power_law_1.01,0.251366400718689
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,16,power_law_1.2,0.09041280150413514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,32,power_law_1.2,0.7437568187713623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,16,power_law_1.01,0.2968319892883301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,16,power_law_1.2,0.09696639776229858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,32,power_law_1.2,0.9440511703491211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,16,power_law_1.01,0.3988095998764038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,16,power_law_1.2,0.10697599649429321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,32,power_law_1.2,1.158067226409912
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,16,power_law_1.01,0.5202816009521485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,16,power_law_1.2,0.10945279598236084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,32,power_law_1.2,1.7624256134033203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,16,power_law_1.2,0.115392005443573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,16,power_law_1.01,0.740006399154663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,32,power_law_1.2,3.6054271697998046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,16,power_law_1.2,0.131167995929718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,16,power_law_1.01,0.9140992164611816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,16,power_law_1.2,0.1393407940864563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,16,power_law_1.01,1.1412223815917968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,16,power_law_1.2,0.1754047989845276
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,16,power_law_1.01,1.748454475402832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,16,power_law_1.2,0.20264320373535155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,16,power_law_1.2,0.2650943994522095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,16,power_law_1.01,3.447462463378906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,16,power_law_1.2,0.31283841133117674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,16,power_law_1.2,0.4289408206939697
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,16,power_law_1.2,0.5473216056823731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,16,power_law_1.2,0.7715583801269531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,8,power_law_1.01,0.06689280271530151
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,16,power_law_1.2,0.9824704170227051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,8,power_law_1.01,0.06812800168991089
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,8,power_law_1.01,0.082259202003479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,16,power_law_1.2,1.1989888191223144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,8,power_law_1.01,0.05685120224952698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,16,power_law_1.2,1.875040054321289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,8,power_law_1.01,0.0630079984664917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,8,power_law_1.2,0.062745600938797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,16,power_law_1.2,3.7167743682861327
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,8,power_law_1.01,0.07427200078964233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,8,power_law_1.2,0.07115520238876342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,8,power_law_1.01,0.07897599935531616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,8,power_law_1.2,0.061939197778701785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,8,power_law_1.01,0.08655359745025634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,8,power_law_1.2,0.060089600086212155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,8,power_law_1.01,0.08839679956436157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,8,power_law_1.2,0.06643840074539184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,8,power_law_1.01,0.09453439712524414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,8,power_law_1.01,0.09701120257377624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,8,power_law_1.2,0.07134079933166504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,8,power_law_1.01,0.10068479776382447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,8,power_law_1.2,0.07769600152969361
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,8,power_law_1.01,0.1004863977432251
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,8,power_law_1.2,0.08549119830131531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,8,power_law_1.01,0.10417280197143555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,8,power_law_1.2,0.09101439714431762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,8,power_law_1.01,0.11338880062103271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,8,power_law_1.2,0.09178879857063293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,8,power_law_1.01,0.1178879976272583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,8,power_law_1.2,0.09859200119972229
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,8,power_law_1.01,0.12730239629745482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,8,power_law_1.2,0.10044159889221191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,4,power_law_1.01,0.0701312005519867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,128,power_law_1.2,0.09864959716796876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,8,power_law_1.01,0.14184319972991943
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,8,power_law_1.2,0.10472960472106933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,4,power_law_1.01,0.07075200080871583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,128,power_law_1.2,0.11298559904098511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,8,power_law_1.01,0.15762560367584227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,8,power_law_1.2,0.1049407958984375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,4,power_law_1.01,0.08406400084495544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,8,power_law_1.01,0.19305599927902223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,128,power_law_1.2,0.12974720001220702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,8,power_law_1.2,0.11066880226135253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,4,power_law_1.01,0.06358399987220764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,8,power_law_1.01,0.21823999881744385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,128,power_law_1.2,0.13059840202331544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,8,power_law_1.2,0.11804800033569336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,4,power_law_1.01,0.0742464005947113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,8,power_law_1.01,0.28316800594329833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,128,power_law_1.2,0.16314879655838013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,8,power_law_1.2,0.1254207968711853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,4,power_law_1.01,0.08692479729652405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,8,power_law_1.01,0.34396159648895264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,128,power_law_1.2,0.19224319458007813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,8,power_law_1.2,0.14835840463638306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,4,power_law_1.01,0.09348480105400085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,8,power_law_1.01,0.4715904235839844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,128,power_law_1.2,0.24651520252227782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,8,power_law_1.2,0.16248960494995118
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,4,power_law_1.01,0.10535680055618286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,8,power_law_1.01,0.5776639938354492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,8,power_law_1.2,0.19402240514755248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,128,power_law_1.2,0.3063040018081665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,4,power_law_1.01,0.11068160533905029
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,8,power_law_1.2,0.21921279430389404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,128,power_law_1.2,0.4185472011566162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,8,power_law_1.01,0.8277376174926758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,4,power_law_1.01,0.1115455985069275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,8,power_law_1.2,0.2999039888381958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,128,power_law_1.2,0.5899648189544677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,8,power_law_1.01,1.0415424346923827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,4,power_law_1.01,0.11642240285873413
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,8,power_law_1.2,0.35726079940795896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,128,power_law_1.2,0.824454402923584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,8,power_law_1.01,1.2764415740966797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,4,power_law_1.01,0.11969920396804809
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,8,power_law_1.2,0.4907711982727051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,128,power_law_1.2,1.008345603942871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,8,power_law_1.01,1.9657983779907227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,4,power_law_1.01,0.12583680152893068
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,8,power_law_1.2,0.6038335800170899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,128,power_law_1.2,1.2944767951965332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,4,power_law_1.01,0.14837119579315186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,8,power_law_1.01,3.9728321075439452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,8,power_law_1.2,0.8870656013488769
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,128,power_law_1.2,2.0567359924316406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,4,power_law_1.01,0.1569599986076355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,8,power_law_1.2,1.0887871742248536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,4,power_law_1.01,0.1737663984298706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,128,power_law_1.2,4.386956787109375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,8,power_law_1.2,1.30383358001709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,4,power_law_1.01,0.1561535954475403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,8,power_law_1.2,2.0951744079589845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,4,power_law_1.01,0.18052480220794678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,4,power_law_1.01,0.19405440092086793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,16,8,power_law_1.01,0.01754239946603775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,8,power_law_1.2,4.320339202880859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,4,power_law_1.01,0.23887999057769777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,16,8,power_law_1.01,0.017759999632835387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,16,8,power_law_1.01,0.017759999632835387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,4,power_law_1.01,0.278604793548584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,16,8,power_law_1.01,0.01733759939670563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,4,power_law_1.01,0.3590912103652954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,16,8,power_law_1.01,0.01774719953536987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,14336,2,8,16,8,power_law_1.2,0.018719999492168425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,16,8,power_law_1.01,0.018559999763965607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,4,power_law_1.01,0.45024638175964354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,14336,2,8,16,8,power_law_1.2,0.017900800704956053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,16,8,power_law_1.01,0.019180800020694732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,14336,2,8,16,8,power_law_1.2,0.019040000438690186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,4,power_law_1.01,0.5935999870300293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,16,8,power_law_1.01,0.019398400187492372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,14336,2,8,16,8,power_law_1.2,0.01770240068435669
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,16,8,power_law_1.01,0.020819200575351714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,4,power_law_1.01,0.7515007972717285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,14336,2,8,16,8,power_law_1.2,0.018918399512767792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,4,power_law_1.2,0.06730239987373351
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,16,8,power_law_1.01,0.02041600048542023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,14336,2,8,16,8,power_law_1.2,0.01892479956150055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,4,power_law_1.01,1.023481559753418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,4,power_law_1.2,0.06832640171051026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,16,8,power_law_1.01,0.021849599480628968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,14336,2,8,16,8,power_law_1.2,0.01932799965143204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,16,8,power_law_1.01,0.024915200471878052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,4,power_law_1.2,0.06095359921455383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,4,power_law_1.01,1.2837632179260254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,14336,2,8,16,8,power_law_1.2,0.01973759979009628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,16,8,power_law_1.01,0.02512640058994293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,14336,2,8,16,8,power_law_1.2,0.021376000344753267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,4,power_law_1.2,0.06259840130805969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,16,8,power_law_1.01,0.02675839960575104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,4,power_law_1.01,1.5686400413513184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,14336,2,8,16,8,power_law_1.2,0.02096640020608902
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,16,8,power_law_1.01,0.02800000011920929
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,4,power_law_1.2,0.0728384017944336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,14336,2,8,16,8,power_law_1.2,0.02178560048341751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,4,power_law_1.01,2.5045696258544923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,16,8,power_law_1.01,0.029228800535202028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,14336,2,8,16,8,power_law_1.2,0.025887998938560485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,4,power_law_1.2,0.08305919766426087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,16,8,power_law_1.01,0.029811200499534608
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,14336,2,8,16,8,power_law_1.2,0.025068798661231996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,4,power_law_1.01,4.692460632324218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,16,8,power_law_1.01,0.03985919952392578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,4,power_law_1.2,0.09023360013961793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,14336,2,8,16,8,power_law_1.2,0.02710399925708771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,16,8,power_law_1.01,0.0412992000579834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,14336,2,8,16,8,power_law_1.2,0.029785600304603577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,4,power_law_1.2,0.10416640043258667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,16,8,power_law_1.01,0.05278720259666443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,14336,2,8,16,8,power_law_1.2,0.029977598786354066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,16,8,power_law_1.01,0.03694080114364624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,4,power_law_1.2,0.1072383999824524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,16,8,power_law_1.01,0.060140800476074216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,14336,2,8,16,8,power_law_1.2,0.029996800422668456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,16,8,power_law_1.01,0.03919360041618347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,16,8,power_law_1.01,0.07631360292434693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,4,power_law_1.2,0.10949759483337403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,14336,2,8,16,8,power_law_1.2,0.03960959911346436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,16,8,power_law_1.01,0.037567999958992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,16,8,power_law_1.01,0.09905279874801635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,14336,2,8,16,8,power_law_1.2,0.04103679955005646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,16,8,power_law_1.01,0.03736959993839264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,4,power_law_1.2,0.11706880331039429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,16,8,power_law_1.01,0.1326464056968689
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,14336,2,8,16,8,power_law_1.2,0.052095997333526614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,16,8,power_law_1.01,0.03818880021572113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,16,8,power_law_1.01,0.17503999471664428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,4,power_law_1.2,0.12158080339431762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,16,8,power_law_1.01,0.03818239867687225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,14336,2,8,16,8,power_law_1.2,0.06051200032234192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,16,8,power_law_1.01,0.25756158828735354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,16,8,power_law_1.01,0.038387200236320494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,14336,2,8,16,8,power_law_1.2,0.08384640216827392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,4,power_law_1.2,0.12341120243072509
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,16,8,power_law_1.01,0.3443903923034668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,16,8,power_law_1.01,0.039417600631713866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,14336,2,8,16,8,power_law_1.2,0.09552000164985656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,4,power_law_1.2,0.13100160360336305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,16,8,power_law_1.01,0.39682559967041015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,16,8,power_law_1.01,0.039417600631713866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,14336,2,8,16,8,power_law_1.2,0.14017280340194702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,16,8,power_law_1.01,0.03962239921092987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,4,power_law_1.2,0.1404096007347107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,16,8,power_law_1.01,0.66593918800354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,14336,2,8,16,8,power_law_1.2,0.16595840454101562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,16,8,power_law_1.01,0.039001598954200745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,14336,2,8,16,8,power_law_1.2,0.26856958866119385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,16,8,power_law_1.01,1.241215991973877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,4,power_law_1.2,0.14675840139389038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,16,8,power_law_1.01,0.04023680090904236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,14336,2,8,16,8,power_law_1.2,0.342905592918396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,4,power_law_1.2,0.1541440010070801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,16,8,power_law_1.01,0.04023680090904236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,14336,2,8,16,8,power_law_1.2,0.43364481925964354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,16,8,power_law_1.01,0.041465601325035094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,14336,2,8,16,8,power_law_1.2,0.03639039993286133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,4,power_law_1.2,0.18586879968643188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,14336,2,8,16,8,power_law_1.2,0.5907199859619141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,16,8,power_law_1.01,0.04597119987010956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,14336,2,8,16,8,power_law_1.2,0.038022398948669434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,4,power_law_1.2,0.20555520057678223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,14336,2,8,16,8,power_law_1.2,1.3218560218811035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,16,8,power_law_1.01,0.04679040014743805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,14336,2,8,16,8,power_law_1.2,0.03516159951686859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,16,8,power_law_1.01,0.04924800097942352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,14336,2,8,16,8,power_law_1.2,0.03639039993286133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,4,power_law_1.2,0.2411776065826416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,16,8,power_law_1.01,0.055379199981689456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,14336,2,8,16,8,power_law_1.2,0.03639039993286133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,4,power_law_1.2,0.2837696075439453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,16,8,power_law_1.01,0.061945599317550656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,14336,2,8,16,8,power_law_1.2,0.03720960021018982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,16,8,power_law_1.01,0.06788480281829834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,16,8,power_law_1.01,0.01892479956150055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,14336,2,8,16,8,power_law_1.2,0.03705599904060364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,4,power_law_1.2,0.3708224058151245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,16,8,power_law_1.01,0.07750399708747864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,16,8,power_law_1.01,0.019334399700164796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,14336,2,8,16,8,power_law_1.2,0.03782399892807007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,4,power_law_1.2,0.4535679817199707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,16,8,power_law_1.01,0.1045375943183899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,16,8,power_law_1.01,0.01932799965143204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,14336,2,8,16,8,power_law_1.2,0.03823359906673431
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,16,8,power_law_1.01,0.11601279973983765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,16,8,power_law_1.01,0.019724799692630766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,14336,2,8,16,8,power_law_1.2,0.03863039910793305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,4,power_law_1.2,0.6079743862152099
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,16,8,power_law_1.01,0.1463039994239807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,16,8,power_law_1.01,0.01913599967956543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,14336,2,8,16,8,power_law_1.2,0.03925119936466217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,4,power_law_1.2,0.7941504001617432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,16,8,power_law_1.01,0.18727680444717407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,16,8,power_law_1.01,0.020972800254821778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,14336,2,8,16,8,power_law_1.2,0.04007680118083954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,16,8,power_law_1.01,0.2667263984680176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,16,8,power_law_1.01,0.021184000372886657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,14336,2,8,16,8,power_law_1.2,0.0412992000579834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,4,power_law_1.2,1.045638370513916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,16,8,power_law_1.01,0.3306368112564087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,16,8,power_law_1.01,0.021996800601482392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,14336,2,8,16,8,power_law_1.2,0.041503998637199405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,4,power_law_1.2,1.319052791595459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,16,8,power_law_1.01,0.022809599339962006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,14336,2,8,16,8,power_law_1.2,0.0448063999414444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,16,8,power_law_1.01,0.4135744094848633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,16,8,power_law_1.01,0.023423999547958374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,14336,2,8,16,8,power_law_1.2,0.046419200301170346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,16,8,power_law_1.01,0.6822847843170166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,4,power_law_1.2,1.6960895538330079
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,16,8,power_law_1.01,0.024460799992084503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,14336,2,8,16,8,power_law_1.2,0.04948480129241943
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,16,8,power_law_1.01,1.343564796447754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,14336,2,8,16,8,power_law_1.2,0.053990399837493895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,16,8,power_law_1.01,0.0285504013299942
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,4,power_law_1.2,2.6205440521240235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,16,8,power_law_1.01,0.028960001468658448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,14336,2,8,16,8,power_law_1.2,0.0605567991733551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,16,8,power_law_1.01,0.03059200048446655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,14336,2,8,16,8,power_law_1.2,0.06936320066452026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,4,power_law_1.2,5.190777587890625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,16,8,power_law_1.01,0.03200640082359314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,14336,2,8,16,8,power_law_1.2,0.08122239708900451
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,16,8,power_law_1.2,0.0201664000749588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,16,8,power_law_1.01,0.0326335996389389
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,14336,2,8,16,8,power_law_1.2,0.10295039415359497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,16,8,power_law_1.2,0.019340799748897554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,16,8,power_law_1.01,0.03592959940433502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,14336,2,8,16,8,power_law_1.2,0.11155840158462524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,16,8,power_law_1.01,0.037196800112724304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,16,8,power_law_1.2,0.019750399887561797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,16,8,power_law_1.01,0.04718720018863678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,14336,2,8,16,8,power_law_1.2,0.15496959686279296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,16,8,power_law_1.2,0.020153599977493285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,16,8,power_law_1.01,0.03904640078544617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,16,8,power_law_1.01,0.052095997333526614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,14336,2,8,16,8,power_law_1.2,0.18956799507141114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,16,8,power_law_1.2,0.020761600136756896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,16,8,power_law_1.01,0.0380160003900528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,16,8,power_law_1.01,0.06643840074539184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,14336,2,8,16,8,power_law_1.2,0.2632960081100464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,16,8,power_law_1.2,0.021184000372886657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,16,8,power_law_1.01,0.038438400626182555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,16,8,power_law_1.01,0.08077440261840821
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,14336,2,8,16,8,power_law_1.2,0.3546432018280029
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,16,8,power_law_1.2,0.020985600352287293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,16,8,power_law_1.01,0.03863680064678192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,16,8,power_law_1.01,0.11354880332946778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,16,8,power_law_1.2,0.022623999416828154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,14336,2,8,16,8,power_law_1.2,0.43308157920837403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,16,8,power_law_1.01,0.039654400944709775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,16,8,power_law_1.01,0.13852800130844117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,16,8,power_law_1.2,0.023027199506759643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,16,8,power_law_1.01,0.04068480134010315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,14336,2,8,16,8,power_law_1.2,0.6860095977783203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,16,8,power_law_1.2,0.023647999763488768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,16,8,power_law_1.01,0.039654400944709775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,14336,2,8,16,8,power_law_1.2,1.3579584121704102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,16,8,power_law_1.2,0.025062400102615356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,16,8,power_law_1.01,0.03945600092411041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,16,8,power_law_1.2,0.02937600016593933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,16,8,power_law_1.01,0.040479999780654904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,16,8,power_law_1.2,0.029529601335525513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,16,8,power_law_1.01,0.04128639996051788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,16,8,power_law_1.2,0.03741439878940582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,16,8,power_law_1.2,0.031225600838661195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,16,8,power_law_1.01,0.04170880019664765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,16,8,power_law_1.2,0.03925119936466217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,16,8,power_law_1.2,0.0328575998544693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,16,8,power_law_1.01,0.043347200751304625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,16,8,power_law_1.2,0.03986560106277466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,16,8,power_law_1.2,0.03325439989566803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,16,8,power_law_1.01,0.04376319944858551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,16,8,power_law_1.2,0.03925760090351105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,16,8,power_law_1.2,0.03450239896774292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,16,8,power_law_1.01,0.048665601015090945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,16,8,power_law_1.2,0.039468801021575926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,16,8,power_law_1.2,0.05006080269813538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,16,8,power_law_1.01,0.05092480182647705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,16,8,power_law_1.2,0.038431999087333676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,16,8,power_law_1.2,0.053337597846984865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,16,8,power_law_1.01,0.054611200094223024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,16,8,power_law_1.2,0.039263999462127684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,16,8,power_law_1.2,0.07299839854240417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,16,8,power_law_1.01,0.06259840130805969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,16,8,power_law_1.2,0.04069760143756866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,16,8,power_law_1.2,0.0889792025089264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,16,8,power_law_1.01,0.06915199756622314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,16,8,power_law_1.2,0.04110080003738403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,16,8,power_law_1.2,0.12277120351791382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,16,8,power_law_1.01,0.08471680283546448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,16,8,power_law_1.2,0.04131200015544891
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,16,8,power_law_1.2,0.14876799583435057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,16,8,power_law_1.01,0.0957759976387024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,16,8,power_law_1.2,0.04111360013484955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,16,8,power_law_1.2,0.21840639114379884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,16,8,power_law_1.2,0.04170880019664765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,16,8,power_law_1.01,0.12095999717712402
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,16,8,power_law_1.2,0.2755392074584961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,16,8,power_law_1.2,0.04314239919185638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,16,8,power_law_1.01,0.14410239458084106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,16,8,power_law_1.2,0.37344000339508054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,16,8,power_law_1.2,0.04519039988517761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,16,8,power_law_1.01,0.2035072088241577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,16,8,power_law_1.2,0.495692777633667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,16,8,power_law_1.2,0.048876801133155824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,16,8,power_law_1.01,0.2407680034637451
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,16,8,power_law_1.2,0.6412928104400635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,16,8,power_law_1.2,0.049907198548316954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,16,8,power_law_1.01,0.33293440341949465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,16,8,power_law_1.2,1.0111935615539551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,16,8,power_law_1.2,0.05355520248413086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,16,8,power_law_1.01,0.43471360206604004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,16,8,power_law_1.2,0.06343039870262146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,16,8,power_law_1.2,1.8811647415161132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,16,8,power_law_1.01,0.5510335922241211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,16,8,power_law_1.2,0.06750720143318176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,16,8,power_law_1.01,0.8740032196044922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,16,8,power_law_1.2,0.0847104012966156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,16,8,power_law_1.01,1.592454433441162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,16,8,power_law_1.2,0.09584640264511109
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,32,4,power_law_1.01,0.019756799936294554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,16,8,power_law_1.2,0.12239999771118164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,32,4,power_law_1.01,0.020160000026226043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,16,8,power_law_1.2,0.15249919891357422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,32,4,power_law_1.01,0.019756799936294554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,16,8,power_law_1.2,0.2067647933959961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,32,4,power_law_1.2,0.019174399971961974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,32,4,power_law_1.01,0.01976960003376007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,16,8,power_law_1.2,0.24280960559844972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,32,4,power_law_1.2,0.018361599743366243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,32,4,power_law_1.01,0.019750399887561797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,16,8,power_law_1.2,0.3472831964492798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,32,4,power_law_1.01,0.01995519995689392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,32,4,power_law_1.2,0.01875839978456497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,16,8,power_law_1.2,0.4502848148345947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,32,4,power_law_1.01,0.0211776003241539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,32,4,power_law_1.2,0.018764799833297728
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,32,4,power_law_1.01,0.021376000344753267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,16,8,power_law_1.2,0.545305585861206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,32,4,power_law_1.2,0.018764799833297728
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,32,4,power_law_1.01,0.022412799298763275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,32,4,power_law_1.2,0.019993600249290467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,16,8,power_law_1.2,0.8686911582946777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,32,4,power_law_1.01,0.02343039959669113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,32,4,power_law_1.2,0.020608000457286835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,16,8,power_law_1.2,1.7030527114868164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,32,4,power_law_1.01,0.02426239997148514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,32,4,power_law_1.2,0.020812800526618956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,32,4,power_law_1.01,0.030399999022483824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,32,4,power_law_1.2,0.022457599639892578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,32,4,power_law_1.01,0.02958720028400421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,32,4,power_law_1.2,0.022860799729824067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,32,4,power_law_1.01,0.04110080003738403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,32,4,power_law_1.01,0.029580798745155335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,32,4,power_law_1.2,0.023475199937820435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,32,4,power_law_1.01,0.04151679873466492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,32,4,power_law_1.01,0.030611199140548707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,32,4,power_law_1.2,0.028198400139808656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,32,4,power_law_1.01,0.040275201201438904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,32,4,power_law_1.01,0.031615999341011045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,32,4,power_law_1.2,0.028595200181007384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,32,4,power_law_1.01,0.03986560106277466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,32,4,power_law_1.01,0.03367680013179779
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,32,4,power_law_1.2,0.029414400458335876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,32,4,power_law_1.01,0.040870401263237
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,32,4,power_law_1.01,0.03715839982032776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,32,4,power_law_1.2,0.030246400833129884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,32,4,power_law_1.01,0.04111360013484955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,32,4,power_law_1.01,0.04309119880199432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,32,4,power_law_1.2,0.030649599432945252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,32,4,power_law_1.01,0.04152320027351379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,32,4,power_law_1.01,0.0603007972240448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,32,4,power_law_1.2,0.03269760012626648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,32,4,power_law_1.01,0.04170880019664765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,32,4,power_law_1.01,0.06931840181350708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,32,4,power_law_1.2,0.03575679957866669
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,32,4,power_law_1.01,0.042316800355911253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,32,4,power_law_1.01,0.0996288001537323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,32,4,power_law_1.2,0.039647999405860904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,32,4,power_law_1.01,0.042534399032592776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,32,4,power_law_1.01,0.11703679561614991
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,32,4,power_law_1.2,0.05870720148086548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,32,4,power_law_1.01,0.042745599150657655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,32,4,power_law_1.01,0.17497600317001344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,32,4,power_law_1.2,0.06731520295143127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,32,4,power_law_1.01,0.044582399725914004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,32,4,power_law_1.01,0.2011967897415161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,32,4,power_law_1.2,0.09456639885902404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,32,4,power_law_1.01,0.04497919976711273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,32,4,power_law_1.01,0.31775360107421874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,32,4,power_law_1.01,0.04785920083522797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,32,4,power_law_1.2,0.11665920019149781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,32,4,power_law_1.01,0.3797760009765625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,32,4,power_law_1.01,0.052767997980117796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,32,4,power_law_1.2,0.1629439949989319
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,32,4,power_law_1.01,0.49898881912231446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,32,4,power_law_1.01,0.055430400371551516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,32,4,power_law_1.2,0.19876480102539062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,32,4,power_law_1.01,0.7236480236053466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,32,4,power_law_1.01,0.05563520193099976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,32,4,power_law_1.2,0.2913599967956543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,32,4,power_law_1.01,1.423846435546875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,32,4,power_law_1.01,0.06096640229225159
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,32,4,power_law_1.2,0.3734656095504761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,32,4,power_law_1.01,0.07488639950752259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,32,4,power_law_1.2,0.45847039222717284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,32,4,power_law_1.01,0.08636800050735474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,32,4,power_law_1.2,0.7199999809265136
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,32,4,power_law_1.2,0.04392319917678833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,32,4,power_law_1.01,0.09659519791603088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,32,4,power_law_1.2,0.04207360148429871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,32,4,power_law_1.2,1.4161215782165528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,32,4,power_law_1.01,0.11975040435791015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,32,4,power_law_1.2,0.041254401206970215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,32,4,power_law_1.01,0.15475200414657592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,32,4,power_law_1.2,0.042694398760795595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,32,4,power_law_1.01,0.21495680809020995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,32,4,power_law_1.2,0.042259201407432556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,32,4,power_law_1.01,0.2534656047821045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,32,4,power_law_1.2,0.041868799924850465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,32,4,power_law_1.01,0.3685695886611938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,32,4,power_law_1.2,0.04185599982738495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,1,128,power_law_1.01,0.0212351992726326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,32,4,power_law_1.01,0.4482367992401123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,32,4,power_law_1.2,0.04268800020217896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,1,128,power_law_1.01,0.021222400665283202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,32,4,power_law_1.01,0.6663296222686768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,32,4,power_law_1.2,0.04268800020217896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,32,4,power_law_1.01,0.9723199844360352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,1,128,power_law_1.01,0.020812800526618956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,32,4,power_law_1.2,0.042694398760795595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,32,4,power_law_1.2,0.043507200479507444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,32,4,power_law_1.01,1.7411455154418944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,1,128,power_law_1.01,0.020819200575351714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,32,4,power_law_1.2,0.044531199336051944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,1,128,power_law_1.01,0.022041599452495574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,32,4,power_law_1.2,0.04597119987010956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,32,4,power_law_1.2,0.046777600049972536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,1,128,power_law_1.01,0.025523200631141663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,32,4,power_law_1.2,0.0531328022480011
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,1,128,power_law_1.01,0.032691198587417605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,32,4,power_law_1.2,0.052928000688552856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,1,128,power_law_1.2,0.021216000616550445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,1,128,power_law_1.01,0.03309440016746521
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,32,4,power_law_1.2,0.0574400007724762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,1,128,power_law_1.2,0.02102400064468384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,32,4,power_law_1.2,0.06542720198631287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,1,128,power_law_1.01,0.03883520066738129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,32,4,power_law_1.2,0.07238399982452393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,1,128,power_law_1.2,0.020614400506019592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,1,128,power_law_1.01,0.040870401263237
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,32,4,power_law_1.2,0.0893887996673584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,1,128,power_law_1.2,0.02143999934196472
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,1,128,power_law_1.01,0.047443199157714847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,32,4,power_law_1.2,0.10413440465927123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,1,128,power_law_1.2,0.022867199778556824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,32,4,power_law_1.2,0.13935359716415405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,1,128,power_law_1.01,0.054816001653671266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,1,128,power_law_1.2,0.025753599405288697
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,32,4,power_law_1.2,0.1721343994140625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,1,128,power_law_1.01,0.06033920049667359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,32,4,power_law_1.2,0.24236159324645995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,1,128,power_law_1.2,0.03187839984893799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,1,128,power_law_1.01,0.0716159999370575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,32,4,power_law_1.2,0.2806463956832886
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,1,128,power_law_1.2,0.03329919874668121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,32,4,power_law_1.2,0.4600512027740479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,1,128,power_law_1.01,0.057043200731277464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,1,128,power_law_1.2,0.039052799344062805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,32,4,power_law_1.2,0.5366720199584961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,1,128,power_law_1.01,0.06402559876441956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,1,128,power_law_1.2,0.04089600145816803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,32,4,power_law_1.2,0.6544191837310791
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,1,128,power_law_1.01,0.07651839852333069
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,1,128,power_law_1.2,0.047244799137115476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,32,4,power_law_1.2,1.0066816329956054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,1,128,power_law_1.01,0.06995840072631836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,1,128,power_law_1.2,0.05379199981689453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,32,4,power_law_1.2,2.054649543762207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,1,128,power_law_1.01,0.08483200073242188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,1,128,power_law_1.2,0.05994240045547485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,1,128,power_law_1.01,0.11994240283966065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,1,128,power_law_1.2,0.07120000123977661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,1,128,power_law_1.01,0.15025919675827026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,1,128,power_law_1.2,0.056467199325561525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,1,128,power_law_1.01,0.08323839902877808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,1,128,power_law_1.2,0.06587520241737366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,1,128,power_law_1.01,0.21577599048614501
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,1,128,power_law_1.01,0.07996799945831298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,1,128,power_law_1.2,0.07611520290374756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,1,128,power_law_1.01,0.2805056095123291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,1,128,power_law_1.2,0.06832640171051026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,1,128,power_law_1.01,0.4050303936004639
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,1,128,power_law_1.2,0.08472319841384887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,1,128,power_law_1.01,0.5338240146636963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,1,128,power_law_1.2,0.12728960514068605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,1,128,power_law_1.01,0.7748928070068359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,1,128,power_law_1.2,0.15024640560150146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,1,128,power_law_1.01,1.034169578552246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,1,128,power_law_1.2,0.21456000804901124
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,1,128,power_law_1.01,1.2969280242919923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,1,128,power_law_1.2,0.28153600692749026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,1,128,power_law_1.01,2.0493568420410155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,1,128,power_law_1.2,0.4093183994293213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,1,128,power_law_1.2,0.5383488178253174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,1,128,power_law_1.01,4.129497528076172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,1,128,power_law_1.2,0.8011072158813477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,1,128,power_law_1.2,1.0476927757263184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,1,128,power_law_1.2,1.3014016151428223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,1,128,power_law_1.2,0.06095359921455383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,1,128,power_law_1.2,0.060127997398376466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,1,128,power_law_1.2,2.0632255554199217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,1,128,power_law_1.2,0.05975040197372437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,1,128,power_law_1.2,4.11272964477539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,1,128,power_law_1.2,0.056857597827911374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,1,128,power_law_1.2,0.05685120224952698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,1,128,power_law_1.2,0.05885440111160278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,1,128,power_law_1.2,0.05931519865989685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,1,128,power_law_1.2,0.060127997398376466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,2,64,power_law_1.01,0.020422400534152986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,1,128,power_law_1.2,0.060755199193954466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,2,64,power_law_1.01,0.02062080055475235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,1,128,power_law_1.2,0.06217600107192993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,2,64,power_law_1.01,0.02041600048542023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,1,128,power_law_1.2,0.06402559876441956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,2,64,power_law_1.01,0.02040960043668747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,2,64,power_law_1.01,0.0243136003613472
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,1,128,power_law_1.2,0.06506239771842956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,2,64,power_law_1.01,0.02573440074920654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,1,128,power_law_1.2,0.06583679914474487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,2,64,power_law_1.01,0.03411200046539307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,1,128,power_law_1.2,0.06627839803695679
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,16,8,power_law_1.01,0.21265919208526612
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,2,64,power_law_1.01,0.03678719997406006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,1,128,power_law_1.2,0.07528319954872131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,16,8,power_law_1.01,0.2671360015869141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,2,64,power_law_1.01,0.04007680118083954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,1,128,power_law_1.2,0.07631360292434693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,16,8,power_law_1.01,0.38940160274505614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,16,8,power_law_1.01,0.49611520767211914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,2,64,power_law_1.01,0.043136000633239746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,1,128,power_law_1.2,0.08081920146942138
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,16,8,power_law_1.01,0.6263552188873291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,2,64,power_law_1.01,0.050521600246429446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,1,128,power_law_1.2,0.09721599817276001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,16,8,power_law_1.01,0.9919232368469239
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,2,64,power_law_1.01,0.05727999806404114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,1,128,power_law_1.2,0.10825599431991577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,16,8,power_law_1.01,1.6698175430297852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,2,64,power_law_1.01,0.06382079720497132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,1,128,power_law_1.2,0.13140480518341063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,2,64,power_law_1.01,0.07754240036010743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,1,128,power_law_1.2,0.14199039936065674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,2,64,power_law_1.01,0.06095359921455383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,1,128,power_law_1.2,0.19073920249938964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,2,64,power_law_1.01,0.0703935980796814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,1,128,power_law_1.2,0.21639039516448974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,2,64,power_law_1.01,0.08389120101928711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,1,128,power_law_1.2,0.2880768060684204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,2,64,power_law_1.2,0.02423679977655411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,2,64,power_law_1.01,0.07694079875946044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,1,128,power_law_1.2,0.40010881423950195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,2,64,power_law_1.2,0.02383359968662262
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,2,64,power_law_1.01,0.09416319727897644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,2,64,power_law_1.2,0.023391999304294586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,1,128,power_law_1.2,0.5293375968933105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,2,64,power_law_1.01,0.12896000146865844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,2,64,power_law_1.2,0.023839999735355378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,2,64,power_law_1.01,0.15865600109100342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,1,128,power_law_1.2,0.7366975784301758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,2,64,power_law_1.2,0.026495999097824095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,2,64,power_law_1.01,0.23031680583953856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,1,128,power_law_1.2,1.0452223777770997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,2,64,power_law_1.2,0.02752000093460083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,2,64,power_law_1.01,0.28624639511108396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,1,128,power_law_1.2,1.5236288070678712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,2,64,power_law_1.2,0.031001600623130798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,2,64,power_law_1.01,0.4178368091583252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,2,64,power_law_1.2,0.034892800450325015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,1,128,power_law_1.2,3.248051071166992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,2,64,power_law_1.01,0.5539135932922363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,2,64,power_law_1.2,0.03694080114364624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,2,64,power_law_1.01,0.8297920227050781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,2,64,power_law_1.2,0.03980799913406372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,2,64,power_law_1.01,1.0708288192749023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,2,64,power_law_1.01,0.08798720240592957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,2,64,power_law_1.2,0.04513919949531555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,2,64,power_law_1.01,1.3759872436523437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,2,64,power_law_1.01,0.07160320281982421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,2,64,power_law_1.2,0.05271040201187134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,2,64,power_law_1.01,2.1771583557128906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,2,64,power_law_1.01,0.059513598680496216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,2,64,power_law_1.2,0.05496320128440857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,2,64,power_law_1.01,0.05788800120353699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,2,64,power_law_1.2,0.07196159958839417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,2,64,power_law_1.01,4.369126510620117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,2,64,power_law_1.01,0.05911679863929749
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,2,64,power_law_1.2,0.05619199872016907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,2,64,power_law_1.01,0.060134398937225345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,2,64,power_law_1.2,0.06193280220031738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,2,64,power_law_1.01,0.06239359974861145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,2,64,power_law_1.2,0.07790079712867737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,2,64,power_law_1.2,0.07857919931411743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,2,64,power_law_1.01,0.06341760158538819
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,2,64,power_law_1.2,0.06970880031585694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,2,64,power_law_1.2,0.07715200185775757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,2,64,power_law_1.2,0.0574783980846405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,2,64,power_law_1.01,0.06321280002593994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,2,64,power_law_1.2,0.0832256019115448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,2,64,power_law_1.2,0.058905601501464844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,2,64,power_law_1.01,0.06588159799575806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,2,64,power_law_1.2,0.10738559961318969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,2,64,power_law_1.2,0.05666559934616089
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,2,64,power_law_1.01,0.06587520241737366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,2,64,power_law_1.2,0.1561344027519226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,2,64,power_law_1.2,0.06096640229225159
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,2,64,power_law_1.01,0.06792320013046264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,2,64,power_law_1.2,0.2071295976638794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,2,64,power_law_1.2,0.06218879818916321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,2,64,power_law_1.01,0.06709120273590088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,2,64,power_law_1.2,0.2806463956832886
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,2,64,power_law_1.2,0.06424319744110107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,2,64,power_law_1.01,0.07037439942359924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,2,64,power_law_1.2,0.4133632183074951
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,2,64,power_law_1.2,0.06321920156478882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,2,64,power_law_1.01,0.07366399765014649
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,2,64,power_law_1.2,0.5653247833251953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,2,64,power_law_1.2,0.06342399716377259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,2,64,power_law_1.01,0.07571200132369996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,2,64,power_law_1.2,0.8256383895874023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,2,64,power_law_1.2,0.06629120111465454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,2,64,power_law_1.01,0.08042240142822266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,2,64,power_law_1.2,1.093721580505371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,2,64,power_law_1.2,0.06629120111465454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,2,64,power_law_1.01,0.09127680063247681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,2,64,power_law_1.2,1.3083328247070312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,2,64,power_law_1.2,0.06751360297203064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,2,64,power_law_1.01,0.10396800041198731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,2,64,power_law_1.2,2.1820095062255858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,2,64,power_law_1.2,0.06851199865341187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,2,64,power_law_1.01,0.12485120296478272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,2,64,power_law_1.2,0.0756991982460022
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,2,64,power_law_1.01,0.13999999761581422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,2,64,power_law_1.2,5.272851181030274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,2,64,power_law_1.2,0.07919999957084656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,2,64,power_law_1.01,0.17599999904632568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,2,64,power_law_1.2,0.08472319841384887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,2,64,power_law_1.01,0.20350079536437987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,2,64,power_law_1.2,0.0980288028717041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,2,64,power_law_1.01,0.2682111978530884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,2,64,power_law_1.2,0.10848000049591064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,2,64,power_law_1.01,0.3304640054702759
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,4,32,power_law_1.01,0.02260479927062988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,2,64,power_law_1.2,0.13141119480133057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,2,64,power_law_1.01,0.46666879653930665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,4,32,power_law_1.01,0.02261119931936264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,2,64,power_law_1.2,0.15291520357131957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,4,32,power_law_1.01,0.022201600670814513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,2,64,power_law_1.01,0.6005951881408691
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,2,64,power_law_1.2,0.19818880558013915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,4,32,power_law_1.01,0.021996800601482392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,2,64,power_law_1.2,0.2182528018951416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,2,64,power_law_1.01,0.7437632083892822
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,4,32,power_law_1.01,0.02343679964542389
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,2,64,power_law_1.2,0.31348481178283694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,2,64,power_law_1.01,1.1744576454162599
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,4,32,power_law_1.01,0.025068798661231996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,2,64,power_law_1.2,0.38414080142974855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,2,64,power_law_1.01,2.221388816833496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,4,32,power_law_1.01,0.028339201211929323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,2,64,power_law_1.2,0.5096767902374267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,4,32,power_law_1.01,0.030380800366401672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,2,64,power_law_1.2,0.6839680194854736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,4,32,power_law_1.01,0.03449600040912628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,2,64,power_law_1.2,0.917024040222168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,4,32,power_law_1.01,0.04022400081157684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,4,32,power_law_1.2,0.020000000298023225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,2,64,power_law_1.2,1.3931903839111328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,4,32,power_law_1.01,0.046367999911308286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,4,32,power_law_1.2,0.019993600249290467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,4,32,power_law_1.01,0.04962559938430786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,4,32,power_law_1.2,0.019980800151824952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,2,64,power_law_1.2,3.0278783798217774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,4,32,power_law_1.01,0.05333120226860046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,4,32,power_law_1.2,0.020396800339221956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,4,32,power_law_1.01,0.06725119948387145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,4,32,power_law_1.2,0.021491199731826782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,4,32,power_law_1.01,0.055174398422241214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,4,32,power_law_1.2,0.024710400402545928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,4,32,power_law_1.01,0.07120000123977661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,4,32,power_law_1.01,0.059468799829483034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,4,32,power_law_1.01,0.06464639902114869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,4,32,power_law_1.2,0.02736639976501465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,4,32,power_law_1.01,0.06930559873580933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,4,32,power_law_1.01,0.057081598043441775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,4,32,power_law_1.2,0.030643200874328612
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,4,32,power_law_1.01,0.06910719871520996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,4,32,power_law_1.01,0.058303999900817874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,4,32,power_law_1.2,0.038438400626182555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,4,32,power_law_1.01,0.06217600107192993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,4,32,power_law_1.01,0.08364800214767457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,4,32,power_law_1.2,0.04120959937572479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,4,32,power_law_1.01,0.06301440000534057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,4,32,power_law_1.01,0.10248960256576538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,4,32,power_law_1.2,0.04785279929637909
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,4,32,power_law_1.01,0.06567040085792542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,4,32,power_law_1.01,0.11843199729919433
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,4,32,power_law_1.2,0.052153599262237546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,4,32,power_law_1.01,0.06689280271530151
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,4,32,power_law_1.2,0.05686399936676025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,4,32,power_law_1.01,0.17333760261535644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,4,32,power_law_1.01,0.06567040085792542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,4,32,power_law_1.2,0.06915199756622314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,4,32,power_law_1.01,0.21921920776367188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,4,32,power_law_1.01,0.06750720143318176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,4,32,power_law_1.2,0.05562880039215088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,4,32,power_law_1.01,0.31875200271606446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,4,32,power_law_1.01,0.07058560252189636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,4,32,power_law_1.2,0.060550397634506224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,4,32,power_law_1.01,0.4299583911895752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,4,32,power_law_1.01,0.0685375988483429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,4,32,power_law_1.2,0.07364479899406433
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,4,32,power_law_1.01,0.6103871822357178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,1,128,power_law_1.01,0.061945599317550656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,4,32,power_law_1.01,0.07262719869613647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,4,32,power_law_1.2,0.06894720196723939
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,4,32,power_law_1.01,0.7891583919525147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,1,128,power_law_1.01,0.05909119844436646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,4,32,power_law_1.01,0.07140480279922486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,4,32,power_law_1.2,0.08533120155334473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,4,32,power_law_1.01,1.006668758392334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,1,128,power_law_1.01,0.05885440111160278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,4,32,power_law_1.01,0.07959679961204529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,4,32,power_law_1.2,0.10477440357208252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,4,32,power_law_1.01,1.639084815979004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,1,128,power_law_1.01,0.059487998485565186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,4,32,power_law_1.01,0.08082559704780579
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,4,32,power_law_1.2,0.12997759580612184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,1,128,power_law_1.01,0.060915201902389526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,4,32,power_law_1.01,0.08716800212860107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,4,32,power_law_1.2,0.18465280532836914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,4,32,power_law_1.01,3.008595275878906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,4,32,power_law_1.01,0.09843199849128723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,1,128,power_law_1.01,0.061536002159118655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,4,32,power_law_1.2,0.22787199020385743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,4,32,power_law_1.01,0.10559999942779541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,1,128,power_law_1.01,0.0621504008769989
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,4,32,power_law_1.2,0.33403520584106444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,4,32,power_law_1.01,0.1351040005683899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,1,128,power_law_1.01,0.06275839805603027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,4,32,power_law_1.2,0.0725823998451233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,4,32,power_law_1.2,0.43306879997253417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,1,128,power_law_1.01,0.06481279730796814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,4,32,power_law_1.01,0.14613120555877684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,4,32,power_law_1.2,0.06828799843788147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,4,32,power_law_1.2,0.6372608184814453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,1,128,power_law_1.01,0.06521599888801574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,4,32,power_law_1.01,0.18240640163421631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,4,32,power_law_1.2,0.05783680081367493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,4,32,power_law_1.2,0.8424639701843262
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,1,128,power_law_1.01,0.065830397605896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,4,32,power_law_1.01,0.21068799495697021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,4,32,power_law_1.2,0.06069759726524353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,4,32,power_law_1.2,1.0468607902526856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,1,128,power_law_1.01,0.06646400094032287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,4,32,power_law_1.2,0.06316800117492676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,4,32,power_law_1.01,0.2817471981048584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,4,32,power_law_1.2,1.6620800018310546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,1,128,power_law_1.01,0.07177600264549255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,4,32,power_law_1.2,0.06356480121612548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,4,32,power_law_1.01,0.3575103998184204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,1,128,power_law_1.01,0.07668480277061462
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,4,32,power_law_1.2,0.06520320177078247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,4,32,power_law_1.2,3.2922943115234373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,4,32,power_law_1.01,0.5019008159637451
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,1,128,power_law_1.01,0.08241279721260071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,4,32,power_law_1.2,0.06765440106391907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,4,32,power_law_1.01,0.6356287956237793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,1,128,power_law_1.01,0.09593600034713745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,4,32,power_law_1.2,0.0705344021320343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,4,32,power_law_1.01,0.7310719966888428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,8,16,power_law_1.01,0.02040960043668747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,1,128,power_law_1.01,0.10700160264968872
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,4,32,power_law_1.2,0.06930559873580933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,8,16,power_law_1.01,0.021222400665283202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,4,32,power_law_1.01,1.1514880180358886
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,1,128,power_law_1.01,0.12460160255432129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,4,32,power_law_1.2,0.0713536024093628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,8,16,power_law_1.01,0.021222400665283202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,1,128,power_law_1.01,0.14303359985351563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,4,32,power_law_1.2,0.07217280268669128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,4,32,power_law_1.01,2.4288511276245117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,8,16,power_law_1.01,0.021836799383163453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,1,128,power_law_1.01,0.17745280265808105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,4,32,power_law_1.2,0.07400959730148315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,8,16,power_law_1.01,0.023289600014686586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,1,128,power_law_1.01,0.20775680541992186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,4,32,power_law_1.2,0.07545599937438965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,8,16,power_law_1.2,0.02040960043668747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,8,16,power_law_1.01,0.02736639976501465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,1,128,power_law_1.01,0.26754560470581057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,4,32,power_law_1.2,0.08200960159301758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,8,16,power_law_1.2,0.02162559926509857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,8,16,power_law_1.01,0.030239999294281006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,4,32,power_law_1.2,0.08426240086555481
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,1,128,power_law_1.01,0.3322688102722168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,8,16,power_law_1.2,0.020819200575351714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,8,16,power_law_1.01,0.03309440016746521
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,4,32,power_law_1.2,0.08671360015869141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,1,128,power_law_1.01,0.5010240077972412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,8,16,power_law_1.2,0.02122880071401596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,8,16,power_law_1.01,0.041305598616600034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,4,32,power_law_1.2,0.10002559423446655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,1,128,power_law_1.01,0.5796671867370605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,8,16,power_law_1.2,0.02389120012521744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,8,16,power_law_1.01,0.04478079974651337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,4,32,power_law_1.2,0.11066880226135253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,1,128,power_law_1.01,0.7330560207366943
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,8,16,power_law_1.2,0.02696320116519928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,8,16,power_law_1.01,0.04948480129241943
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,4,32,power_law_1.2,0.13523839712142943
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,8,16,power_law_1.2,0.02983039915561676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,1,128,power_law_1.01,1.251417636871338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,8,16,power_law_1.01,0.059724801778793336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,4,32,power_law_1.2,0.155731201171875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,8,16,power_law_1.2,0.032287999987602234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,8,16,power_law_1.01,0.06587520241737366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,1,128,power_law_1.01,2.2418239593505858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,4,32,power_law_1.2,0.19546879529953004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,8,16,power_law_1.2,0.0412992000579834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,8,16,power_law_1.01,0.08144000172615051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,4,32,power_law_1.2,0.23396480083465576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,8,16,power_law_1.2,0.04416640102863312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,8,16,power_law_1.01,0.06464639902114869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,4,32,power_law_1.2,0.31445119380950926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,8,16,power_law_1.2,0.049055999517440795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,8,16,power_law_1.01,0.07811200022697448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,8,16,power_law_1.01,0.070796799659729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,4,32,power_law_1.2,0.3703552007675171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,8,16,power_law_1.2,0.060134398937225345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,8,16,power_law_1.01,0.08242560029029847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,8,16,power_law_1.01,0.08920959830284118
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,8,16,power_law_1.2,0.06567040085792542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,4,32,power_law_1.2,0.5284607887268067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,8,16,power_law_1.01,0.06316800117492676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,8,16,power_law_1.01,0.08472319841384887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,8,16,power_law_1.2,0.08062719702720642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,4,32,power_law_1.2,0.6896383762359619
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,8,16,power_law_1.01,0.06399359703063964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,8,16,power_law_1.01,0.10684159994125367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,8,16,power_law_1.2,0.06505600214004517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,4,32,power_law_1.2,0.9100159645080567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,8,16,power_law_1.01,0.06399359703063964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,8,16,power_law_1.01,0.11502079963684082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,8,16,power_law_1.2,0.0703935980796814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,4,32,power_law_1.2,1.4920512199401856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,8,16,power_law_1.01,0.07011200189590454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,8,16,power_law_1.01,0.14513280391693115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,8,16,power_law_1.2,0.08861439824104309
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,8,16,power_law_1.01,0.07011839747428894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,8,16,power_law_1.01,0.20083839893341066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,8,16,power_law_1.2,0.0849407970905304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,4,32,power_law_1.2,2.9070016860961916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,8,16,power_law_1.01,0.07422080039978027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,8,16,power_law_1.2,0.10723199844360351
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,8,16,power_law_1.01,0.2565376043319702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,8,16,power_law_1.01,0.0729856014251709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,8,16,power_law_1.2,0.11564160585403442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,8,16,power_law_1.01,0.37839360237121583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,8,16,power_law_1.01,0.07729920148849487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,8,16,power_law_1.2,0.1453376054763794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,8,16,power_law_1.2,0.07810559868812561
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,8,16,power_law_1.01,0.48510079383850097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,8,16,power_law_1.01,0.08038399815559387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,8,16,power_law_1.2,0.20718719959259033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,8,16,power_law_1.2,0.08302720189094544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,8,16,power_law_1.01,0.7171328067779541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,8,16,power_law_1.01,0.07996799945831298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,8,16,power_law_1.2,0.2569472074508667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,8,16,power_law_1.2,0.059033602476119995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,8,16,power_law_1.01,0.9432319641113281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,8,16,power_law_1.01,0.08037760257720947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,8,16,power_law_1.2,0.06111999750137329
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,8,16,power_law_1.2,0.37798399925231935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,8,16,power_law_1.01,1.1629823684692382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,8,16,power_law_1.01,0.08139520287513732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,8,16,power_law_1.2,0.06561279892921448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,8,16,power_law_1.2,0.4854911804199219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,8,16,power_law_1.01,1.8623743057250977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,8,16,power_law_1.01,0.08794879913330078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,8,16,power_law_1.2,0.06725119948387145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,8,16,power_law_1.2,0.7171328067779541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,8,16,power_law_1.01,0.08979840278625488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,8,16,power_law_1.2,0.0729856014251709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,8,16,power_law_1.01,3.6922367095947264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,8,16,power_law_1.2,0.9436287879943848
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,8,16,power_law_1.01,0.09757440090179444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,8,16,power_law_1.2,0.07216640114784241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,8,16,power_law_1.2,1.1732288360595704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,8,16,power_law_1.01,0.11148159503936768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,8,16,power_law_1.2,0.07440000176429748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,8,16,power_law_1.01,0.12359039783477783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,8,16,power_law_1.2,1.8607168197631836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,16,8,power_law_1.01,0.021644799411296843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,8,16,power_law_1.2,0.07912960052490234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,8,16,power_law_1.01,0.14343680143356324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,16,8,power_law_1.01,0.021836799383163453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,8,16,power_law_1.2,0.07790079712867737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,8,16,power_law_1.2,3.703327941894531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,8,16,power_law_1.01,0.16186879873275756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,16,8,power_law_1.01,0.022841599583625794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,8,16,power_law_1.2,0.07954559922218322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,8,16,power_law_1.01,0.1983423948287964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,16,8,power_law_1.01,0.02328319996595383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,8,16,power_law_1.2,0.08198400139808655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,16,8,power_law_1.01,0.02531839907169342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,8,16,power_law_1.01,0.23848319053649902
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,16,8,power_law_1.2,0.02122880071401596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,8,16,power_law_1.2,0.08364800214767457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,16,8,power_law_1.01,0.029407998919486998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,16,8,power_law_1.2,0.02162559926509857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,8,16,power_law_1.01,0.3076864004135132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,8,16,power_law_1.2,0.08977919816970825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,16,8,power_law_1.01,0.03270399868488312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,16,8,power_law_1.2,0.022886399924755097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,8,16,power_law_1.2,0.09100800156593322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,8,16,power_law_1.01,0.3996416091918945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,16,8,power_law_1.01,0.036160001158714296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,16,8,power_law_1.2,0.022867199778556824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,8,16,power_law_1.2,0.09961599707603455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,8,16,power_law_1.01,0.54683518409729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,16,8,power_law_1.01,0.03925760090351105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,16,8,power_law_1.2,0.02593280076980591
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,8,16,power_law_1.2,0.11044479608535766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,8,16,power_law_1.01,0.6851456165313721
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,16,8,power_law_1.01,0.0474368005990982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,16,8,power_law_1.2,0.0286080002784729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,8,16,power_law_1.2,0.1229375958442688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,8,16,power_law_1.01,0.8678144454956055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,16,8,power_law_1.01,0.05440000295639038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,16,8,power_law_1.2,0.03270399868488312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,8,16,power_law_1.2,0.141593599319458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,8,16,power_law_1.01,1.2952447891235352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,16,8,power_law_1.01,0.059520000219345094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,16,8,power_law_1.2,0.035571199655532834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,8,16,power_law_1.2,0.16680320501327514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,16,8,power_law_1.01,0.07242239713668823
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,8,16,power_law_1.01,2.5406400680541994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,16,8,power_law_1.2,0.03925760090351105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,8,16,power_law_1.2,0.20162560939788818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,16,8,power_law_1.01,0.08389760255813598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,16,8,power_law_1.2,0.04723840057849884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,8,16,power_law_1.2,0.24645121097564698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,16,8,power_law_1.01,0.06689280271530151
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,16,8,power_law_1.2,0.05400320291519165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,8,16,power_law_1.2,0.325708794593811
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,16,8,power_law_1.01,0.07653120160102844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,16,8,power_law_1.2,0.05973119735717773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,16,8,power_law_1.01,0.07218559980392455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,8,16,power_law_1.2,0.42135038375854494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,16,8,power_law_1.01,0.09555839896202087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,16,8,power_law_1.2,0.0677183985710144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,16,8,power_law_1.01,0.0815999984741211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,8,16,power_law_1.2,0.6359871864318848
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,16,8,power_law_1.01,0.09556480050086975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,16,8,power_law_1.2,0.08370559811592101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,16,8,power_law_1.01,0.0701312005519867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,8,16,power_law_1.2,0.7715583801269531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,16,8,power_law_1.01,0.11808639764785767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,16,8,power_law_1.2,0.06670079827308655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,16,8,power_law_1.01,0.06849279999732971
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,8,16,power_law_1.2,0.8977151870727539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,16,8,power_law_1.01,0.12649600505828856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,16,8,power_law_1.01,0.07297919988632202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,16,8,power_law_1.2,0.0751039981842041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,8,16,power_law_1.2,1.4920639991760254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,16,8,power_law_1.01,0.15742720365524293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,16,8,power_law_1.01,0.07935360074043274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,16,8,power_law_1.2,0.09351680278778077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,16,8,power_law_1.01,0.22191998958587647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,16,8,power_law_1.01,0.08753920197486878
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,16,8,power_law_1.2,0.09351680278778077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,8,16,power_law_1.2,2.9487871170043944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,16,8,power_law_1.01,0.2893183946609497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,16,8,power_law_1.01,0.0906112015247345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,16,8,power_law_1.2,0.1162559986114502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,16,8,power_law_1.01,0.4159872055053711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,16,8,power_law_1.01,0.0930624008178711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,16,8,power_law_1.2,0.13366400003433226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,16,8,power_law_1.01,0.09594240188598632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,16,8,power_law_1.01,0.5604608058929443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,16,8,power_law_1.2,0.1582335948944092
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,16,8,power_law_1.2,0.08076800107955932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,16,8,power_law_1.01,0.09264640212059021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,16,8,power_law_1.2,0.2246016025543213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,16,8,power_law_1.01,0.8056063652038574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,16,8,power_law_1.2,0.08138239979743958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,16,8,power_law_1.01,0.09388800263404846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,16,8,power_law_1.2,0.2938175916671753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,16,8,power_law_1.2,0.06233599781990051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,16,8,power_law_1.01,1.0226943969726563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,16,8,power_law_1.01,0.09634559750556945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,16,8,power_law_1.2,0.06725760102272034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,16,8,power_law_1.2,0.42736001014709474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,16,8,power_law_1.01,1.3440192222595215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,16,8,power_law_1.01,0.1004480004310608
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,16,8,power_law_1.2,0.07381759881973267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,16,8,power_law_1.2,0.5506239891052246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,16,8,power_law_1.01,2.112851142883301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,16,8,power_law_1.01,0.10699520111083985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,16,8,power_law_1.2,0.07462400197982788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,16,8,power_law_1.2,0.8240447998046875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,16,8,power_law_1.01,0.10842880010604858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,16,8,power_law_1.01,4.138528060913086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,16,8,power_law_1.2,0.08446080088615418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,16,8,power_law_1.2,1.0403072357177734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,16,8,power_law_1.01,0.12092800140380859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,16,8,power_law_1.2,0.08814719915390015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,16,8,power_law_1.01,0.13525760173797607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,16,8,power_law_1.2,1.3366527557373047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,16,8,power_law_1.2,0.08691200017929077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,16,8,power_law_1.01,0.14960000514984131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,1,128,power_law_1.01,0.018764799833297728
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,16,8,power_law_1.2,2.145625686645508
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,16,8,power_law_1.2,0.08896639943122864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,16,8,power_law_1.01,0.17866239547729493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,1,128,power_law_1.01,0.018361599743366243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,16,8,power_law_1.2,0.09448959827423095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,1,128,power_law_1.01,0.018764799833297728
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,16,8,power_law_1.2,4.480742263793945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,16,8,power_law_1.01,0.20344319343566894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,16,8,power_law_1.2,0.09633920192718506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,1,128,power_law_1.01,0.018963199853897095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,16,8,power_law_1.01,0.24542720317840577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,1,128,power_law_1.01,0.01959040015935898
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,16,8,power_law_1.2,0.09633920192718506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,16,8,power_law_1.01,0.2789952039718628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,1,128,power_law_1.01,0.020812800526618956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,1,128,power_law_1.2,0.018777599930763243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,16,8,power_law_1.2,0.10248960256576538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,16,8,power_law_1.01,0.3867392063140869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,1,128,power_law_1.01,0.022041599452495574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,1,128,power_law_1.2,0.018572799861431122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,16,8,power_law_1.2,0.1061568021774292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,16,8,power_law_1.01,0.46825599670410156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,1,128,power_law_1.01,0.023680000007152556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,1,128,power_law_1.2,0.018572799861431122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,16,8,power_law_1.2,0.11352959871292115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,16,8,power_law_1.01,0.6777599811553955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,1,128,power_law_1.01,0.025523200631141663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,1,128,power_law_1.2,0.018559999763965607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,16,8,power_law_1.2,0.12112640142440796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,1,128,power_law_1.01,0.026348799467086792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,16,8,power_law_1.01,0.8870783805847168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,1,128,power_law_1.2,0.019193600118160247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,16,8,power_law_1.2,0.1372928023338318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,1,128,power_law_1.01,0.029836800694465638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,1,128,power_law_1.2,0.020627200603485107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,16,8,power_law_1.01,1.0234623908996583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,16,8,power_law_1.2,0.15446399450302123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,1,128,power_law_1.01,0.027161601185798644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,1,128,power_law_1.2,0.022252799570560457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,16,8,power_law_1.01,1.6419647216796875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,16,8,power_law_1.2,0.17497600317001344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,1,128,power_law_1.01,0.0281792014837265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,1,128,power_law_1.2,0.024300800263881685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,1,128,power_law_1.01,0.03043839931488037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,16,8,power_law_1.2,0.19871360063552856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,1,128,power_law_1.2,0.026348799467086792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,16,8,power_law_1.01,3.29510383605957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,1,128,power_law_1.01,0.030028799176216127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,1,128,power_law_1.2,0.02717440128326416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,16,8,power_law_1.2,0.2661119937896729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,1,128,power_law_1.01,0.03146879971027374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,1,128,power_law_1.2,0.02821120023727417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,16,8,power_law_1.2,0.3089215993881226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,1,128,power_law_1.01,0.034329599142074584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,1,128,power_law_1.01,0.03858560025691986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,1,128,power_law_1.2,0.02717440128326416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,16,8,power_law_1.2,0.4039423942565918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,1,128,power_law_1.01,0.04293760061264038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,1,128,power_law_1.01,0.03982079923152924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,1,128,power_law_1.2,0.027584001421928406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,16,8,power_law_1.2,0.5153535842895508
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,1,128,power_law_1.01,0.04806399941444397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,1,128,power_law_1.01,0.039801600575447085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,1,128,power_law_1.2,0.03167999982833862
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,16,8,power_law_1.2,0.7420671939849853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,1,128,power_law_1.01,0.058911997079849246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,1,128,power_law_1.01,0.03960959911346436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,1,128,power_law_1.2,0.030649599432945252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,1,128,power_law_1.01,0.07694079875946044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,1,128,power_law_1.01,0.039212799072265624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,1,128,power_law_1.2,0.0310591995716095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,16,8,power_law_1.2,0.8727359771728516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,1,128,power_law_1.01,0.1064255952835083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,1,128,power_law_1.01,0.039827200770378116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,1,128,power_law_1.2,0.03454720079898834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,16,8,power_law_1.2,1.1330368041992187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,1,128,power_law_1.01,0.040633600950241086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,1,128,power_law_1.01,0.11994880437850952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,1,128,power_law_1.2,0.042745599150657655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,16,8,power_law_1.2,1.7894079208374023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,1,128,power_law_1.01,0.04126079976558685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,1,128,power_law_1.2,0.04663040041923523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,1,128,power_law_1.01,0.0398144006729126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,1,128,power_law_1.2,0.06667519807815551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,16,8,power_law_1.2,3.4699966430664064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,1,128,power_law_1.01,0.040031999349594116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,1,128,power_law_1.2,0.08247680068016053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,1,128,power_law_1.01,0.041875201463699344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,1,128,power_law_1.2,0.10439039468765259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,1,128,power_law_1.01,0.0416703999042511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,1,128,power_law_1.2,0.13797760009765625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,1,128,power_law_1.2,0.040249601006507874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,1,128,power_law_1.01,0.042284798622131345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,1,128,power_law_1.2,0.19447679519653321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,1,128,power_law_1.2,0.03919360041618347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,1,128,power_law_1.01,0.043910399079322815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,1,128,power_law_1.2,0.257587194442749
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,1,128,power_law_1.2,0.03941119909286499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,1,128,power_law_1.01,0.047200000286102294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,1,128,power_law_1.2,0.03898879885673523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,1,128,power_law_1.2,0.3808448076248169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,1,128,power_law_1.01,0.04843519926071167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,1,128,power_law_1.2,0.03818239867687225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,1,128,power_law_1.2,0.4994239807128906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,1,128,power_law_1.01,0.0488319993019104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,1,128,power_law_1.2,0.03899520039558411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,1,128,power_law_1.2,0.619865608215332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,1,128,power_law_1.01,0.054553598165512085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,1,128,power_law_1.2,0.03960959911346436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,1,128,power_law_1.01,0.05989120006561279
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,1,128,power_law_1.2,0.9768320083618164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,1,128,power_law_1.2,0.03899520039558411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,1,128,power_law_1.01,0.06604160070419311
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,1,128,power_law_1.2,0.039001598954200745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,1,128,power_law_1.2,1.9346752166748047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,1,128,power_law_1.01,0.07832959890365601
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,1,128,power_law_1.2,0.03898879885673523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,1,128,power_law_1.01,0.09593600034713745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,1,128,power_law_1.2,0.04023039937019348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,1,128,power_law_1.01,0.10821759700775146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,1,128,power_law_1.2,0.040627199411392215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,2,64,power_law_1.01,0.018361599743366243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,1,128,power_law_1.01,0.1418176054954529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,1,128,power_law_1.2,0.04227199852466583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,2,64,power_law_1.01,0.018361599743366243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,1,128,power_law_1.01,0.17273600101470948
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,1,128,power_law_1.2,0.04431999921798706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,2,64,power_law_1.01,0.017951999604701997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,1,128,power_law_1.01,0.25363199710845946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,1,128,power_law_1.2,0.04759680032730103
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,2,64,power_law_1.01,0.017951999604701997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,1,128,power_law_1.2,0.047167998552322385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,2,64,power_law_1.01,0.018777599930763243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,1,128,power_law_1.01,0.31466240882873536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,2,64,power_law_1.01,0.02143999934196472
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,1,128,power_law_1.2,0.05046399831771851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,1,128,power_law_1.01,0.4092735767364502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,2,64,power_law_1.01,0.022060799598693847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,1,128,power_law_1.2,0.056601601839065555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,1,128,power_law_1.01,0.6962111949920654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,2,64,power_law_1.01,0.024902400374412537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,1,128,power_law_1.2,0.06419199705123901
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,2,64,power_law_1.01,0.02512640058994293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,1,128,power_law_1.01,1.370201587677002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,1,128,power_law_1.2,0.07319679856300354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,2,64,power_law_1.01,0.029824000597000123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,1,128,power_law_1.2,0.08630399703979492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,2,64,power_law_1.01,0.02963840067386627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,1,128,power_law_1.2,0.11272319555282592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,2,64,power_law_1.01,0.028191998600959778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,1,128,power_law_1.2,0.13648639917373656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,2,64,power_law_1.2,0.019756799936294554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,2,64,power_law_1.01,0.030656000971794127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,2,64,power_law_1.2,0.019340799748897554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,1,128,power_law_1.2,0.19013760089874268
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,2,64,power_law_1.01,0.030035200715065002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,2,64,power_law_1.2,0.018931199610233308
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,1,128,power_law_1.2,0.21962239742279052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,2,64,power_law_1.01,0.03188480138778686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,2,64,power_law_1.2,0.01913599967956543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,1,128,power_law_1.2,0.3248960018157959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,2,64,power_law_1.01,0.03495680093765259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,2,64,power_law_1.2,0.01974399983882904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,1,128,power_law_1.2,0.43646721839904784
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,2,64,power_law_1.01,0.034329599142074584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,2,64,power_law_1.2,0.022598400712013245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,2,64,power_law_1.01,0.04457600116729736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,1,128,power_law_1.2,0.53788161277771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,2,64,power_law_1.2,0.022617599368095397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,2,64,power_law_1.01,0.04805760085582733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,2,64,power_law_1.2,0.023852799832820893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,1,128,power_law_1.2,0.8375103950500489
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,2,64,power_law_1.01,0.061791998147964475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,2,64,power_law_1.2,0.026092800498008727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,1,128,power_law_1.2,1.6407295227050782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,2,64,power_law_1.01,0.07817599773406983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,2,64,power_law_1.2,0.029996800422668456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,2,64,power_law_1.01,0.0964031994342804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,2,64,power_law_1.2,0.03163520097732544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,2,64,power_law_1.01,0.13038719892501832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,2,64,power_law_1.2,0.031615999341011045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,2,64,power_law_1.01,0.040627199411392215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,2,64,power_law_1.2,0.031430399417877196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,2,64,power_law_1.01,0.1828160047531128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,2,64,power_law_1.01,0.04245760142803192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,2,64,power_law_1.2,0.03223679959774017
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,2,64,power_law_1.01,0.2213184118270874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,2,64,power_law_1.01,0.03919999897480011
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,2,64,power_law_1.2,0.034092798829078674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,2,64,power_law_1.01,0.3192064046859741
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,2,64,power_law_1.01,0.03858560025691986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,2,64,power_law_1.2,0.0361407995223999
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,2,64,power_law_1.01,0.46053118705749513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,2,64,power_law_1.2,0.03654400110244751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,2,64,power_law_1.01,0.04022400081157684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,2,64,power_law_1.01,0.5276991844177246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,2,64,power_law_1.01,0.040838399529457094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,2,64,power_law_1.2,0.04535680115222931
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,2,64,power_law_1.01,0.8834495544433594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,2,64,power_law_1.2,0.050470399856567386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,2,64,power_law_1.01,0.0398144006729126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,2,64,power_law_1.2,0.06686080098152161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,2,64,power_law_1.01,0.04083200097084046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,2,64,power_law_1.01,1.7566335678100586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,2,64,power_law_1.2,0.07955840229988098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,2,64,power_law_1.01,0.04023039937019348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,2,64,power_law_1.2,0.11293439865112305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,2,64,power_law_1.01,0.04103040099143982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,2,64,power_law_1.2,0.03966720104217529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,2,64,power_law_1.2,0.14466559886932373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,2,64,power_law_1.01,0.04145280122756958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,2,64,power_law_1.2,0.03986560106277466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,2,64,power_law_1.01,0.043084800243377686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,2,64,power_law_1.2,0.04007680118083954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,2,64,power_law_1.01,0.04309119880199432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,2,64,power_law_1.2,0.03864319920539856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,2,64,power_law_1.01,0.042284798622131345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,2,64,power_law_1.2,0.04007039964199066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,2,64,power_law_1.01,0.04615679979324341
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,2,64,power_law_1.2,0.04007039964199066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,2,64,power_law_1.01,0.04677119851112366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,2,64,power_law_1.2,0.04007680118083954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,2,64,power_law_1.01,0.05004799962043762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,2,64,power_law_1.2,0.04069119989871979
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,2,64,power_law_1.01,0.05578240156173706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,2,64,power_law_1.2,0.03966079950332642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,2,64,power_law_1.01,0.060063999891281125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,2,64,power_law_1.2,0.04028159976005554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,2,64,power_law_1.01,0.06970880031585694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,2,64,power_law_1.2,0.041510400176048276
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,2,64,power_law_1.01,0.07667840123176575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,2,64,power_law_1.2,0.043347200751304625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,2,64,power_law_1.01,0.09716479778289795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,2,64,power_law_1.2,0.04335359930992126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,2,64,power_law_1.01,0.11845760345458985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,2,64,power_law_1.2,0.04376319944858551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,2,64,power_law_1.01,0.14466559886932373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,2,64,power_law_1.2,0.04848000109195709
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,2,64,power_law_1.01,0.17763199806213378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,2,64,power_law_1.2,0.048467200994491574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,2,64,power_law_1.01,0.23519361019134521
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,2,64,power_law_1.2,0.05297279953956604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,2,64,power_law_1.01,0.3066688060760498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,2,64,power_law_1.2,0.05687680244445801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,2,64,power_law_1.2,0.06670719981193543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,2,64,power_law_1.01,0.3920639991760254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,2,64,power_law_1.2,0.07427840232849121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,2,64,power_law_1.01,0.5706560134887695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,2,64,power_law_1.2,0.08307200074195861
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,2,64,power_law_1.2,0.10922880172729492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,2,64,power_law_1.01,1.232147216796875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,2,64,power_law_1.2,0.13243520259857178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,2,64,power_law_1.2,0.19407999515533447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,2,64,power_law_1.2,0.20677120685577394
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,4,32,power_law_1.01,0.01892479956150055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,2,64,power_law_1.2,0.30385921001434324
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,4,32,power_law_1.01,0.01892479956150055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,4,32,power_law_1.01,0.01892479956150055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,2,64,power_law_1.2,0.48506879806518555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,4,32,power_law_1.01,0.018918399512767792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,2,64,power_law_1.2,0.49779839515686036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,4,32,power_law_1.01,0.019334399700164796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,2,64,power_law_1.2,0.9944319725036621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,4,32,power_law_1.01,0.020972800254821778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,4,32,power_law_1.01,0.021996800601482392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,2,64,power_law_1.2,2.152582359313965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,4,32,power_law_1.01,0.022195200622081756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,4,32,power_law_1.01,0.02361599951982498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,4,32,power_law_1.01,0.02526719868183136
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,4,32,power_law_1.2,0.018367999792099
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,4,32,power_law_1.01,0.029574400186538695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,4,32,power_law_1.2,0.018771199882030486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,4,32,power_law_1.01,0.025472000241279602
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,4,32,power_law_1.2,0.018367999792099
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,4,32,power_law_1.01,0.026086398959159852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,4,32,power_law_1.2,0.018566399812698364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,4,32,power_law_1.01,0.030796799063682555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,4,32,power_law_1.2,0.01918720006942749
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,4,32,power_law_1.01,0.027929601073265076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,4,32,power_law_1.2,0.02001280039548874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,4,32,power_law_1.01,0.03059200048446655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,4,32,power_law_1.2,0.02143999934196472
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,4,32,power_law_1.01,0.038176000118255615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,4,32,power_law_1.2,0.022035199403762817
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,4,32,power_law_1.01,0.040217599272727965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,4,32,power_law_1.2,0.02328319996595383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,4,32,power_law_1.01,0.04922879934310913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,4,32,power_law_1.2,0.024710400402545928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,4,32,power_law_1.01,0.06069759726524353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,4,32,power_law_1.2,0.0310591995716095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,4,32,power_law_1.01,0.07257599830627441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,4,32,power_law_1.2,0.02654080092906952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,4,32,power_law_1.01,0.10780800580978393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,4,32,power_law_1.2,0.028191998600959778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,4,32,power_law_1.01,0.11967999935150146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,4,32,power_law_1.2,0.033523198962211606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,4,32,power_law_1.01,0.17006720304489137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,4,32,power_law_1.2,0.02964479923248291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,4,32,power_law_1.01,0.2228991985321045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,4,32,power_law_1.2,0.03188480138778686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,4,32,power_law_1.01,0.2921344041824341
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,4,32,power_law_1.2,0.03678719997406006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,4,32,power_law_1.01,0.4321983814239502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,4,32,power_law_1.2,0.04519039988517761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,4,32,power_law_1.01,0.53788161277771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,4,32,power_law_1.2,0.049491199851036075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,4,32,power_law_1.2,0.06260480284690857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,4,32,power_law_1.01,0.8301376342773438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,4,32,power_law_1.2,0.07859200239181519
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,4,32,power_law_1.01,1.7795904159545899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,4,32,power_law_1.2,0.10732799768447876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,4,32,power_law_1.2,0.12382719516754151
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,4,32,power_law_1.2,0.19265279769897461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,4,32,power_law_1.01,0.04431360065937042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,4,32,power_law_1.2,0.24261119365692138
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,4,32,power_law_1.01,0.04268159866333008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,4,32,power_law_1.2,0.36160640716552733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,4,32,power_law_1.01,0.03777279853820801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,4,32,power_law_1.2,0.5043519973754883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,4,32,power_law_1.01,0.03837440013885498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,4,32,power_law_1.01,0.039603200554847715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,1,128,power_law_1.01,0.1695039987564087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,4,32,power_law_1.2,0.6385151863098144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,4,32,power_law_1.01,0.041247999668121337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,1,128,power_law_1.01,0.21884799003601074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,4,32,power_law_1.2,1.076140785217285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,4,32,power_law_1.01,0.0412416011095047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,1,128,power_law_1.01,0.3308864116668701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,4,32,power_law_1.01,0.041657599806785586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,4,32,power_law_1.2,2.1361919403076173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,1,128,power_law_1.01,0.4074751853942871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,4,32,power_law_1.01,0.041868799924850465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,1,128,power_law_1.01,0.5371071815490722
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,4,32,power_law_1.01,0.04186240136623383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,1,128,power_law_1.01,0.8584383964538574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,4,32,power_law_1.2,0.04478079974651337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,4,32,power_law_1.01,0.04349440038204193
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,4,32,power_law_1.2,0.03863680064678192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,4,32,power_law_1.01,0.04349440038204193
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,1,128,power_law_1.01,1.5850751876831055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,4,32,power_law_1.2,0.03678080141544342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,4,32,power_law_1.01,0.04431999921798706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,4,32,power_law_1.2,0.03813759982585907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,4,32,power_law_1.01,0.04514560103416443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,4,32,power_law_1.2,0.03925119936466217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,4,32,power_law_1.01,0.048819199204444885
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,4,32,power_law_1.2,0.04047360122203827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,4,32,power_law_1.01,0.05088000297546387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,4,32,power_law_1.01,0.022457599639892578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,4,32,power_law_1.2,0.04110719859600067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,4,32,power_law_1.01,0.05251200199127197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,4,32,power_law_1.01,0.022860799729824067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,4,32,power_law_1.2,0.04170880019664765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,4,32,power_law_1.01,0.05783039927482605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,4,32,power_law_1.01,0.02245119959115982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,4,32,power_law_1.2,0.04191359877586365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,4,32,power_law_1.01,0.061926400661468504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,4,32,power_law_1.01,0.022438399493694305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,4,32,power_law_1.2,0.041510400176048276
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,4,32,power_law_1.01,0.07175679802894593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,4,32,power_law_1.01,0.025727999210357667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,4,32,power_law_1.2,0.04293760061264038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,4,32,power_law_1.01,0.08301439881324768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,4,32,power_law_1.01,0.024512000381946564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,4,32,power_law_1.2,0.04416640102863312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,4,32,power_law_1.01,0.10289280414581299
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,4,32,power_law_1.01,0.02648960053920746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,4,32,power_law_1.2,0.04539520144462585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,4,32,power_law_1.01,0.12009600400924683
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,4,32,power_law_1.01,0.02983039915561676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,4,32,power_law_1.2,0.04519680142402649
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,4,32,power_law_1.01,0.03597440123558045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,4,32,power_law_1.01,0.15491199493408203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,4,32,power_law_1.2,0.04907520115375519
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,4,32,power_law_1.01,0.03842560052871704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,4,32,power_law_1.01,0.19259519577026368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,4,32,power_law_1.2,0.05134080052375793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,4,32,power_law_1.01,0.042124798893928526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,4,32,power_law_1.01,0.2784064054489136
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,4,32,power_law_1.2,0.0546176016330719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,4,32,power_law_1.01,0.04620800018310547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,4,32,power_law_1.01,0.33145599365234374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,4,32,power_law_1.2,0.06095359921455383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,4,32,power_law_1.01,0.039647999405860904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,4,32,power_law_1.01,0.43016958236694336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,4,32,power_law_1.2,0.06547200083732604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,4,32,power_law_1.01,0.04314239919185638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,4,32,power_law_1.01,0.5784255981445312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,4,32,power_law_1.2,0.07736319899559022
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,4,32,power_law_1.01,0.049497601389884946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,4,32,power_law_1.2,0.08268160223960877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,4,32,power_law_1.01,0.046214398741722104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,4,32,power_law_1.01,1.2976896286010742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,4,32,power_law_1.2,0.11215360164642334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,4,32,power_law_1.01,0.05030400156974792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,4,32,power_law_1.2,0.13610880374908446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,4,32,power_law_1.01,0.06172800064086914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,4,32,power_law_1.01,0.07222399711608887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,4,32,power_law_1.2,0.20668160915374756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,4,32,power_law_1.01,0.09373440146446228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,4,32,power_law_1.2,0.23319039344787598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,2560,8,160,4,32,power_law_1.2,0.02343039959669113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,4,32,power_law_1.01,0.10663039684295654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,4,32,power_law_1.2,0.32965760231018065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,2560,8,160,4,32,power_law_1.2,0.022195200622081756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,4,32,power_law_1.01,0.15433599948883056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,2560,8,160,4,32,power_law_1.2,0.022598400712013245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,4,32,power_law_1.2,0.40748162269592286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,4,32,power_law_1.01,0.19571839570999144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,2560,8,160,4,32,power_law_1.2,0.02240000069141388
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,4,32,power_law_1.2,0.7105855941772461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,4,32,power_law_1.01,0.3079360008239746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,2560,8,160,4,32,power_law_1.2,0.025068798661231996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,4,32,power_law_1.2,0.9231679916381836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,2560,8,160,4,32,power_law_1.2,0.024665600061416625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,4,32,power_law_1.01,0.3738816022872925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,4,32,power_law_1.2,2.2213951110839845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,2560,8,160,4,32,power_law_1.2,0.026700800657272337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,4,32,power_law_1.01,0.5788864135742188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,2560,8,160,4,32,power_law_1.2,0.03407999873161316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,4,32,power_law_1.01,0.7195903778076171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,2560,8,160,4,32,power_law_1.2,0.035718399286270144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,4,32,power_law_1.01,0.938316822052002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,4,32,power_law_1.01,0.07427200078964233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,2560,8,160,4,32,power_law_1.2,0.03776000142097473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,4,32,power_law_1.01,1.5703231811523437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,4,32,power_law_1.01,0.06587520241737366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,2560,8,160,4,32,power_law_1.2,0.0416703999042511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,4,32,power_law_1.01,0.05564799904823303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,2560,8,160,4,32,power_law_1.2,0.047788798809051514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,4,32,power_law_1.01,3.1603904724121095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,4,32,power_law_1.01,0.05687680244445801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,2560,8,160,4,32,power_law_1.2,0.03980799913406372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,4,32,power_law_1.01,0.0574783980846405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,2560,8,160,4,32,power_law_1.2,0.04474239945411682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,4,32,power_law_1.01,0.058905601501464844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,2560,8,160,4,32,power_law_1.2,0.0525056004524231
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,2560,8,160,4,32,power_law_1.2,0.07365120053291321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,4,32,power_law_1.01,0.0611840009689331
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,2560,8,160,4,32,power_law_1.2,0.046374401450157164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,2560,8,160,4,32,power_law_1.2,0.05727999806404114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,4,32,power_law_1.01,0.06218879818916321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,2560,8,160,4,32,power_law_1.2,0.05278080105781555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,2560,8,160,4,32,power_law_1.2,0.049644801020622256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,4,32,power_law_1.01,0.061363202333450315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,2560,8,160,4,32,power_law_1.2,0.05622400045394897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,2560,8,160,4,32,power_law_1.2,0.061945599317550656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,2,64,power_law_1.2,0.2016063928604126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,4,32,power_law_1.01,0.0630079984664917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,2560,8,160,4,32,power_law_1.2,0.05665919780731201
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,2560,8,160,4,32,power_law_1.2,0.07893120050430298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,2,64,power_law_1.2,0.2747200012207031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,4,32,power_law_1.01,0.06384639739990235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,2560,8,160,4,32,power_law_1.2,0.0593280017375946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,2560,8,160,4,32,power_law_1.2,0.10329600572586059
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,2,64,power_law_1.2,0.3898047924041748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,4,32,power_law_1.01,0.06546559929847717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,2560,8,160,4,32,power_law_1.2,0.06074879765510559
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,2560,8,160,4,32,power_law_1.2,0.1258239984512329
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,2,64,power_law_1.2,0.5222976207733154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,4,32,power_law_1.01,0.06628479957580566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,2560,8,160,4,32,power_law_1.2,0.06217600107192993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,2560,8,160,4,32,power_law_1.2,0.17129600048065186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,2,64,power_law_1.2,0.6503168106079101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,4,32,power_law_1.01,0.06731520295143127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,2560,8,160,4,32,power_law_1.2,0.061977601051330565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,2560,8,160,4,32,power_law_1.2,0.24174718856811522
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,2,64,power_law_1.2,1.0337023735046387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,4,32,power_law_1.01,0.0726527988910675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,2560,8,160,4,32,power_law_1.2,0.06382079720497132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,2560,8,160,4,32,power_law_1.2,0.34495360851287843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,4,32,power_law_1.01,0.07529600262641907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,2560,8,160,4,32,power_law_1.2,0.06628479957580566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,2,64,power_law_1.2,2.017363166809082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,2560,8,160,4,32,power_law_1.2,0.4408127784729004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,4,32,power_law_1.01,0.07938560247421264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,2560,8,160,4,32,power_law_1.2,0.06669440269470214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,2560,8,160,4,32,power_law_1.2,0.7072512149810791
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,4,32,power_law_1.01,0.08862079977989197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,2560,8,160,4,32,power_law_1.2,0.06565759778022766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,2560,8,160,4,32,power_law_1.2,0.8792832374572754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,4,32,power_law_1.01,0.09987199902534485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,2560,8,160,4,32,power_law_1.2,0.06935039758682252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,1,128,power_law_1.01,0.09203199744224548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,2560,8,160,4,32,power_law_1.2,0.0720255970954895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,4,32,power_law_1.01,0.12055039405822754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,2560,8,160,4,32,power_law_1.2,1.120748805999756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,1,128,power_law_1.01,0.07628160119056701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,2560,8,160,4,32,power_law_1.2,0.07571840286254883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,4,32,power_law_1.01,0.1328511953353882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,2560,8,160,4,32,power_law_1.2,1.8233983993530274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,1,128,power_law_1.01,0.06869760155677795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,2560,8,160,4,32,power_law_1.2,0.08083199858665466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,4,32,power_law_1.01,0.17400959730148316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,1,128,power_law_1.01,0.05968639850616455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,2560,8,160,4,32,power_law_1.2,0.09208319783210754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,4,32,power_law_1.01,0.187116801738739
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,2560,8,160,4,32,power_law_1.2,4.041401672363281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,2560,8,160,4,32,power_law_1.2,0.10396800041198731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,1,128,power_law_1.01,0.06276479959487916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,4,32,power_law_1.01,0.2710975885391235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,2560,8,160,4,32,power_law_1.2,0.1275264024734497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,4,32,power_law_1.01,0.29976320266723633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,1,128,power_law_1.01,0.0621504008769989
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,2560,8,160,4,32,power_law_1.2,0.1445248007774353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,1,128,power_law_1.2,0.07811200022697448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,1,128,power_law_1.01,0.06480640172958374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,4,32,power_law_1.01,0.43021440505981445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,2560,8,160,4,32,power_law_1.2,0.1832319974899292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,1,128,power_law_1.2,0.07870720028877258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,1,128,power_law_1.01,0.06686080098152161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,4,32,power_law_1.01,0.5702976226806641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,2560,8,160,4,32,power_law_1.2,0.21700479984283447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,1,128,power_law_1.2,0.06603519916534424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,1,128,power_law_1.01,0.06520320177078247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,4,32,power_law_1.01,0.674124813079834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,2560,8,160,4,32,power_law_1.2,0.29054720401763917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,1,128,power_law_1.01,0.06645119786262513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,1,128,power_law_1.2,0.058873599767684935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,4,32,power_law_1.01,1.1945343971252442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,2560,8,160,4,32,power_law_1.2,0.3955967903137207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,1,128,power_law_1.01,0.06929919719696045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,1,128,power_law_1.2,0.06111360192298889
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,2560,8,160,4,32,power_law_1.2,0.5338431835174561
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,4,32,power_law_1.01,2.158278465270996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,1,128,power_law_1.01,0.07340800166130065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,1,128,power_law_1.2,0.06110720038414001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,2560,8,160,4,32,power_law_1.2,0.7040256023406982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,1,128,power_law_1.01,0.07177600264549255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,2560,8,160,4,32,power_law_1.2,0.90513916015625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,1,128,power_law_1.2,0.06234880089759827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,2,64,power_law_1.01,0.07325440049171447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,1,128,power_law_1.01,0.07546240091323853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,1,128,power_law_1.2,0.06643840074539184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,2560,8,160,4,32,power_law_1.2,1.3776127815246582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,2,64,power_law_1.01,0.09331200122833253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,1,128,power_law_1.01,0.0797439992427826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,1,128,power_law_1.2,0.06502400040626526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,2560,8,160,4,32,power_law_1.2,3.160396766662598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,2,64,power_law_1.01,0.06628479957580566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,1,128,power_law_1.01,0.08199679851531982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,1,128,power_law_1.2,0.06643840074539184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,2,64,power_law_1.01,0.05931519865989685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,1,128,power_law_1.01,0.08733440041542054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,1,128,power_law_1.2,0.07032319903373718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,2,64,power_law_1.01,0.06096000075340271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,1,128,power_law_1.01,0.10248960256576538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,2,64,power_law_1.2,0.07406719923019409
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,1,128,power_law_1.2,0.06993920207023621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,2,64,power_law_1.01,0.06321920156478882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,1,128,power_law_1.01,0.11558400392532349
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,2,64,power_law_1.2,0.09207680225372314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,1,128,power_law_1.2,0.07278720140457154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,1,128,power_law_1.01,0.13854080438613892
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,2,64,power_law_1.01,0.06464639902114869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,2,64,power_law_1.2,0.0642304003238678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,1,128,power_law_1.2,0.07381759881973267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,1,128,power_law_1.01,0.15368959903717042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,2,64,power_law_1.01,0.06711040139198303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,1,128,power_law_1.2,0.08076800107955932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,1,128,power_law_1.01,0.1942463994026184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,2,64,power_law_1.01,0.06711040139198303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,1,128,power_law_1.2,0.08466560244560242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,1,128,power_law_1.01,0.22474238872528077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,2,64,power_law_1.01,0.06750720143318176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,1,128,power_law_1.2,0.08978559970855712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,1,128,power_law_1.01,0.29767038822174074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,2,64,power_law_1.01,0.070796799659729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,1,128,power_law_1.2,0.1080064058303833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,2,64,power_law_1.01,0.07037439942359924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,1,128,power_law_1.01,0.37854719161987305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,1,128,power_law_1.2,0.1155776023864746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,2,64,power_law_1.01,0.07404800057411194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,1,128,power_law_1.01,0.5407680034637451
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,1,128,power_law_1.2,0.14016640186309814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,2,64,power_law_1.01,0.07200639843940734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,1,128,power_law_1.2,0.16186879873275756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,1,128,power_law_1.01,0.6686975955963135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,2,64,power_law_1.01,0.0787775993347168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,1,128,power_law_1.2,0.20856959819793702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,1,128,power_law_1.01,0.8301440238952636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,2,64,power_law_1.01,0.08327040076255798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,1,128,power_law_1.2,0.2405247926712036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,1,128,power_law_1.01,1.2796735763549805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,2,64,power_law_1.01,0.08635519742965699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,1,128,power_law_1.2,0.32751998901367185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,1,128,power_law_1.01,2.537753677368164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,2,64,power_law_1.01,0.09965440034866332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,1,128,power_law_1.2,0.4059840202331543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,2,64,power_law_1.01,0.11584000587463379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,1,128,power_law_1.2,0.5714623928070068
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,2,64,power_law_1.01,0.134278404712677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,4,32,power_law_1.01,0.07546240091323853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,1,128,power_law_1.2,0.7510784149169922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,2,64,power_law_1.01,0.1541375994682312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,4,32,power_law_1.01,0.0760703980922699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,1,128,power_law_1.2,0.9882304191589355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,2,64,power_law_1.01,0.197324800491333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,4,32,power_law_1.01,0.07400959730148315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,2,64,power_law_1.01,0.22520959377288818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,1,128,power_law_1.2,1.5362751960754395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,4,32,power_law_1.01,0.06133120059967041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,2,64,power_law_1.01,0.30139520168304446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,4,32,power_law_1.01,0.06561920046806335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,1,128,power_law_1.2,3.0495424270629883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,2,64,power_law_1.01,0.37348480224609376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,4,32,power_law_1.01,0.06808320283889771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,2,64,power_law_1.01,0.5076288223266602
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,4,32,power_law_1.01,0.07054719924926758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,2,64,power_law_1.01,0.6532159805297851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,4,32,power_law_1.2,0.07360640168190002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,4,32,power_law_1.01,0.0732096016407013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,2,64,power_law_1.01,0.8260736465454102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,4,32,power_law_1.2,0.07995520234107971
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,4,32,power_law_1.01,0.0736191987991333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,4,32,power_law_1.2,0.07278720140457154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,4,32,power_law_1.01,0.07545599937438965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,2,64,power_law_1.01,1.2469632148742675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,4,32,power_law_1.01,0.0787392020225525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,4,32,power_law_1.2,0.061926400661468504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,2,64,power_law_1.01,2.536992073059082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,4,32,power_law_1.01,0.08118399977684021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,4,32,power_law_1.2,0.06232960224151611
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,4,32,power_law_1.01,0.08078719973564148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,4,32,power_law_1.2,0.06664959788322448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,4,32,power_law_1.01,0.08364800214767457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,4,32,power_law_1.2,0.06888960003852844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,8,16,power_law_1.01,0.07199360132217407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,4,32,power_law_1.01,0.09184640049934387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,4,32,power_law_1.2,0.0705407977104187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,8,16,power_law_1.01,0.08021759986877441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,4,32,power_law_1.01,0.09102079868316651
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,4,32,power_law_1.2,0.07196800112724304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,8,16,power_law_1.01,0.08819839954376221
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,4,32,power_law_1.01,0.09635199904441834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,4,32,power_law_1.2,0.07790719866752624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,8,16,power_law_1.01,0.060140800476074216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,4,32,power_law_1.01,0.10945919752120972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,4,32,power_law_1.2,0.07832959890365601
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,8,16,power_law_1.01,0.06423680186271667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,4,32,power_law_1.01,0.12277120351791382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,4,32,power_law_1.2,0.08035200238227844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,8,16,power_law_1.01,0.0728384017944336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,4,32,power_law_1.01,0.1450943946838379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,4,32,power_law_1.2,0.08364800214767457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,8,16,power_law_1.01,0.07448319792747497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,4,32,power_law_1.01,0.16537599563598632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,4,32,power_law_1.2,0.08117759823799134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,8,16,power_law_1.01,0.07774720191955567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,4,32,power_law_1.01,0.20734720230102538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,4,32,power_law_1.2,0.08730239868164062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,8,16,power_law_1.01,0.07816320061683654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,4,32,power_law_1.01,0.2442176103591919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,4,32,power_law_1.2,0.09305599927902222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,8,16,power_law_1.01,0.08328319787979126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,4,32,power_law_1.01,0.3187648057937622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,4,32,power_law_1.2,0.09675520062446594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,8,16,power_law_1.01,0.08124160170555114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,4,32,power_law_1.01,0.3949440002441406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,4,32,power_law_1.2,0.1131327986717224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,8,16,power_law_1.01,0.08840960264205933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,4,32,power_law_1.01,0.5395391941070556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,4,32,power_law_1.2,0.12254079580307006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,8,16,power_law_1.01,0.08840960264205933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,4,32,power_law_1.2,0.14835200309753419
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,8,16,power_law_1.01,0.0877951979637146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,4,32,power_law_1.01,0.6998847961425781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,4,32,power_law_1.2,0.1708799958229065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,8,16,power_law_1.01,0.09783040285110474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,4,32,power_law_1.01,0.82357759475708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,8,16,power_law_1.01,0.09905279874801635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,4,32,power_law_1.2,0.20692479610443115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,4,32,power_law_1.01,1.3116352081298828
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,8,16,power_law_1.01,0.1064255952835083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,4,32,power_law_1.2,0.24440319538116456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,4,32,power_law_1.01,2.5344768524169923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,8,16,power_law_1.01,0.12117120027542114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,4,32,power_law_1.2,0.33063039779663084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,8,16,power_law_1.01,0.13408000469207765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,4,32,power_law_1.2,0.41869440078735354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,8,16,power_law_1.01,0.1584447979927063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,4,32,power_law_1.2,0.6128384113311768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,8,16,power_law_1.2,0.07218559980392455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,8,16,power_law_1.01,0.18465280532836914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,4,32,power_law_1.2,0.7658304214477539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,8,16,power_law_1.2,0.08079360127449035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,8,16,power_law_1.01,0.23320319652557372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,8,16,power_law_1.2,0.07565439939498901
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,4,32,power_law_1.2,0.908351993560791
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,8,16,power_law_1.01,0.26124160289764403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,8,16,power_law_1.2,0.061536002159118655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,8,16,power_law_1.01,0.3570879936218262
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,4,32,power_law_1.2,1.4365440368652345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,8,16,power_law_1.2,0.06604160070419311
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,8,16,power_law_1.01,0.43799681663513185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,4,32,power_law_1.2,2.9909759521484376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,8,16,power_law_1.2,0.07259520292282104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,8,16,power_law_1.01,0.6055359840393066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,8,16,power_law_1.2,0.07707520127296448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,8,16,power_law_1.01,0.7822720050811768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,8,16,power_law_1.2,0.08099200129508972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,8,16,power_law_1.01,0.96495361328125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,16,8,power_law_1.01,0.0828224003314972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,8,16,power_law_1.2,0.08236799836158752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,16,8,power_law_1.01,0.08524799942970276
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,8,16,power_law_1.01,1.4058752059936523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,8,16,power_law_1.2,0.08201599717140198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,16,8,power_law_1.01,0.10371840000152588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,8,16,power_law_1.2,0.08732159733772278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,8,16,power_law_1.01,2.7526527404785157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,16,8,power_law_1.01,0.06765440106391907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,8,16,power_law_1.2,0.08610560297966004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,16,8,power_law_1.01,0.07378559708595275
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,8,16,power_law_1.2,0.09073920249938965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,16,8,power_law_1.01,0.08486400246620178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,8,16,power_law_1.2,0.09041280150413514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,16,8,power_law_1.2,0.07939839959144593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,16,8,power_law_1.01,0.08691200017929077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,8,16,power_law_1.2,0.09715840220451355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,16,8,power_law_1.2,0.08513280153274536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,16,8,power_law_1.01,0.0942911982536316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,8,16,power_law_1.2,0.10289920568466186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,16,8,power_law_1.2,0.0728384017944336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,16,8,power_law_1.01,0.09921280145645142
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,8,16,power_law_1.2,0.11090559959411621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,16,8,power_law_1.2,0.0648639976978302
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,16,8,power_law_1.01,0.10412160158157349
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,8,16,power_law_1.2,0.12502399682998658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,16,8,power_law_1.2,0.06917120218276977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,8,16,power_law_1.2,0.1430400013923645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,16,8,power_law_1.01,0.10514559745788574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,16,8,power_law_1.2,0.07692800164222717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,8,16,power_law_1.2,0.1686336040496826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,16,8,power_law_1.01,0.11190400123596192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,16,8,power_law_1.2,0.08410239815711976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,8,16,power_law_1.2,0.18644479513168336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,16,8,power_law_1.01,0.1123136043548584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,16,8,power_law_1.2,0.09575679898262024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,8,16,power_law_1.2,0.23479681015014647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,16,8,power_law_1.01,0.11764479875564575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,16,8,power_law_1.2,0.09475839734077454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,8,16,power_law_1.2,0.2765631914138794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,16,8,power_law_1.01,0.12460160255432129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,16,8,power_law_1.2,0.10067199468612671
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,8,16,power_law_1.2,0.36586239337921145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,16,8,power_law_1.01,0.12848639488220215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,16,8,power_law_1.2,0.10539519786834717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,16,8,power_law_1.01,0.13647359609603882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,8,16,power_law_1.2,0.4559807777404785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,16,8,power_law_1.2,0.1090880036354065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,16,8,power_law_1.01,0.1565567970275879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,8,16,power_law_1.2,0.6507391929626465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,16,8,power_law_1.2,0.10929919481277466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,16,8,power_law_1.01,0.17313920259475707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,8,16,power_law_1.2,0.9014016151428222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,16,8,power_law_1.2,0.11463040113449097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,16,8,power_law_1.01,0.20119040012359618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,8,16,power_law_1.2,1.0222399711608887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,16,8,power_law_1.2,0.12033280134201049
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,16,8,power_law_1.01,0.2263808012008667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,8,16,power_law_1.2,1.5977215766906738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,16,8,power_law_1.2,0.12527999877929688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,16,8,power_law_1.01,0.2847424030303955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,8,16,power_law_1.2,3.0929855346679687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,16,8,power_law_1.2,0.14325759410858155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,16,8,power_law_1.01,0.3306368112564087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,16,8,power_law_1.2,0.1584447979927063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,16,8,power_law_1.01,0.43875842094421386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,16,8,power_law_1.2,0.16888959407806398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,16,8,power_law_1.01,0.5239615917205811
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,16,8,power_law_1.2,0.20821120738983154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,16,8,power_law_1.01,0.7555903911590576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,16,8,power_law_1.2,0.2385279893875122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,16,8,power_law_1.01,0.9444031715393066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,16,8,power_law_1.2,0.2874624013900757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,16,8,power_law_1.01,1.1444992065429687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,16,8,power_law_1.2,0.33785600662231446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,16,8,power_law_1.2,0.44947199821472167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,16,8,power_law_1.01,1.7742591857910157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,8,power_law_1.01,0.029791998863220214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,16,8,power_law_1.2,0.5555520057678223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,8,power_law_1.01,0.029996800422668456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,16,8,power_law_1.01,3.589811325073242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,8,power_law_1.01,0.029996800422668456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,16,8,power_law_1.2,0.7703807830810547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,8,power_law_1.01,0.0297791987657547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,8,power_law_1.01,0.03204480111598969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,16,8,power_law_1.2,0.977235221862793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,8,power_law_1.01,0.039827200770378116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,16,8,power_law_1.2,1.2805439949035644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,8,power_law_1.01,0.04433279931545257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,2,64,power_law_1.2,0.058899199962615965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,8,power_law_1.01,0.03245440125465393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,2,64,power_law_1.2,0.06096000075340271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,16,8,power_law_1.2,1.9354944229125977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,8,power_law_1.01,0.03244799971580505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,8,power_law_1.01,0.03287039995193482
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,2,64,power_law_1.2,0.06341760158538819
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,8,power_law_1.01,0.034092798829078674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,16,8,power_law_1.2,3.8728958129882813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,2,64,power_law_1.2,0.06341760158538819
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,8,power_law_1.01,0.03450239896774292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,8,power_law_1.01,0.034694400429725644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,2,64,power_law_1.2,0.06547200083732604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,8,power_law_1.2,0.03038719892501831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,8,power_law_1.01,0.03573119938373566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,8,power_law_1.2,0.029977598786354066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,8,power_law_1.01,0.042694398760795595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,2,64,power_law_1.2,0.06587520241737366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,8,power_law_1.2,0.029772800207138062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,8,power_law_1.01,0.042284798622131345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,2,64,power_law_1.2,0.06791679859161377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,8,power_law_1.01,0.048019200563430786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,8,power_law_1.2,0.029977598786354066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,8,power_law_1.01,0.05723519921302796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,8,power_law_1.2,0.030579200387001036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,2,64,power_law_1.2,0.06893439888954163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,8,power_law_1.01,0.05783039927482605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,8,power_law_1.2,0.03735679984092712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,2,64,power_law_1.2,0.07180799841880799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,8,power_law_1.01,0.07668480277061462
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,8,power_law_1.2,0.04391680061817169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,8,power_law_1.01,0.08610560297966004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,8,power_law_1.2,0.03164800107479095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,2,64,power_law_1.2,0.0732479989528656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,8,power_law_1.01,0.1205183982849121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,8,power_law_1.2,0.03159680068492889
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,2,64,power_law_1.2,0.07386239767074584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,8,power_law_1.01,0.10413440465927123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,8,power_law_1.2,0.03243519961833954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,8,power_law_1.01,0.035155200958251955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,8,power_law_1.01,0.1506175994873047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,2,64,power_law_1.2,0.08023040294647217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,8,power_law_1.2,0.03285120129585266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,8,power_law_1.01,0.03597440123558045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,8,power_law_1.2,0.03529599905014038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,2,64,power_law_1.2,0.08266239762306213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,8,power_law_1.01,0.03475840091705322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,8,power_law_1.2,0.03470079898834229
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,2,64,power_law_1.2,0.09228799939155578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,8,power_law_1.01,0.03229439854621887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,8,power_law_1.2,0.035308799147605895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,8,power_law_1.01,0.033107200264930726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,8,power_law_1.2,0.040627199411392215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,2,64,power_law_1.2,0.10150400400161744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,8,power_law_1.01,0.03392640054225922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,8,power_law_1.2,0.043296000361442565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,2,64,power_law_1.2,0.12035200595855713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,8,power_law_1.01,0.03373439908027649
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,8,power_law_1.2,0.046348801255226134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,8,power_law_1.01,0.033932799100875856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,8,power_law_1.2,0.05559039711952209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,2,64,power_law_1.2,0.14410239458084106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,8,power_law_1.01,0.034745600819587705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,8,power_law_1.2,0.06193280220031738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,2,64,power_law_1.2,0.15843199491500853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,8,power_law_1.01,0.03555839955806732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,8,power_law_1.2,0.07994239926338195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,8,power_law_1.01,0.0367935985326767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,8,power_law_1.2,0.0852735996246338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,2,64,power_law_1.2,0.21004800796508788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,8,power_law_1.01,0.0367935985326767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,8,power_law_1.2,0.10003199577331542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,2,64,power_law_1.2,0.23790719509124755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,8,power_law_1.01,0.03782399892807007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,8,power_law_1.2,0.09960960149765015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,8,power_law_1.01,0.041715198755264284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,8,power_law_1.2,0.15736960172653197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,2,64,power_law_1.2,0.32699520587921144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,8,power_law_1.01,0.047417598962783816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,8,power_law_1.2,0.18191360235214232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,2,64,power_law_1.2,0.3968384027481079
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,8,power_law_1.01,0.04807040095329285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,8,power_law_1.2,0.28433918952941895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,8,power_law_1.01,0.051948797702789304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,2,64,power_law_1.2,0.5760191917419434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,8,power_law_1.2,0.3474112033843994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,8,power_law_1.01,0.06936320066452026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,8,power_law_1.2,0.4866879940032959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,2,64,power_law_1.2,0.7400767803192139
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,8,power_law_1.01,0.07693439722061157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,8,power_law_1.2,0.7441152095794678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,8,power_law_1.01,0.0937279999256134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,2,64,power_law_1.2,0.897766399383545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,8,power_law_1.2,1.474022388458252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,8,power_law_1.01,0.1004863977432251
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,8,power_law_1.01,0.12877440452575684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,2,64,power_law_1.2,1.4173055648803712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,8,power_law_1.01,0.15190399885177613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,8,power_law_1.01,0.218451189994812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,2,64,power_law_1.2,2.84517765045166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,8,power_law_1.01,0.26677761077880857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,8,power_law_1.01,0.36796159744262696
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,8,power_law_1.01,0.458406400680542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,8,power_law_1.01,0.5268928050994873
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,8,power_law_1.01,0.8895808219909668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,8,power_law_1.01,1.7612096786499023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,8,power_law_1.2,0.03694080114364624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,8,power_law_1.2,0.03818239867687225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,8,power_law_1.2,0.03694080114364624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,8,power_law_1.2,0.03285120129585266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,256,power_law_1.01,0.1215872049331665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,8,power_law_1.2,0.03284479975700379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,8,power_law_1.2,0.03387520015239716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,256,power_law_1.01,0.12280960083007812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,8,power_law_1.2,0.034483200311660765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,256,power_law_1.01,0.07344639897346497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,8,power_law_1.2,0.03427839875221252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,256,power_law_1.01,0.07366399765014649
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,8,power_law_1.2,0.03551360070705414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,8,power_law_1.2,0.03612160086631775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,256,power_law_1.01,0.07242879867553711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,256,power_law_1.2,0.13100800514221192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,8,power_law_1.2,0.03654400110244751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,256,power_law_1.01,0.07570559978485107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,256,power_law_1.2,0.08554239869117737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,8,power_law_1.2,0.03776000142097473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,256,power_law_1.01,0.07653120160102844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,256,power_law_1.2,0.084307199716568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,8,power_law_1.2,0.03816959857940674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,8,power_law_1.2,0.04184960126876831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,256,power_law_1.01,0.0630079984664917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,256,power_law_1.2,0.07241600155830383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,8,power_law_1.2,0.0469760000705719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,256,power_law_1.01,0.06096000075340271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,256,power_law_1.2,0.07098879814147949
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,8,power_law_1.2,0.04677119851112366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,256,power_law_1.01,0.0642304003238678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,8,power_law_1.2,0.0555840015411377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,256,power_law_1.2,0.0751039981842041
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,8,power_law_1.2,0.0717631995677948
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,256,power_law_1.01,0.07100160121917724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,256,power_law_1.2,0.07612159848213196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,8,power_law_1.2,0.07749760150909424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,256,power_law_1.01,0.07407360076904297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,256,power_law_1.2,0.06279680132865906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,8,power_law_1.2,0.09981439709663391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,256,power_law_1.01,0.07365760207176208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,256,power_law_1.2,0.06343039870262146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,8,power_law_1.2,0.09798399806022644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,8,power_law_1.2,0.1319551944732666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,256,power_law_1.01,0.0720255970954895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,256,power_law_1.2,0.0646399974822998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,8,power_law_1.2,0.15162880420684816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,256,power_law_1.01,0.07774080038070678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,256,power_law_1.2,0.0685375988483429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,8,power_law_1.2,0.21531519889831544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,256,power_law_1.01,0.08492159843444824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,256,power_law_1.2,0.07242239713668823
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,8,power_law_1.2,0.2718400001525879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,256,power_law_1.01,0.08961920142173767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,8,power_law_1.2,0.40147838592529295
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,256,power_law_1.2,0.07345920205116271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,8,power_law_1.2,0.44202880859375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,256,power_law_1.01,0.10805759429931641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,256,power_law_1.2,0.0779583990573883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,8,power_law_1.2,0.5792511940002442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,256,power_law_1.01,0.11910400390625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,256,power_law_1.2,0.08512639999389648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,8,power_law_1.2,0.8407808303833008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,256,power_law_1.01,0.15066239833831788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,256,power_law_1.2,0.08716800212860107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,8,power_law_1.2,1.8029375076293945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,256,power_law_1.01,0.15947519540786742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,256,power_law_1.2,0.09188479781150818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,256,power_law_1.01,0.19939199686050416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,256,power_law_1.2,0.11789439916610718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,256,power_law_1.01,0.24035840034484862
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,256,power_law_1.2,0.14165120124816893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,256,power_law_1.01,0.3534080028533936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,256,power_law_1.2,0.17851519584655762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,256,power_law_1.01,0.3992831945419312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,256,power_law_1.2,0.18138879537582397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,256,power_law_1.01,0.558406400680542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,256,power_law_1.2,0.24364800453186036
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,256,power_law_1.2,0.310809588432312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,256,power_law_1.01,0.6761792182922364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,256,power_law_1.2,0.4871551990509033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,256,power_law_1.01,0.8965375900268555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,256,power_law_1.2,0.5522816181182861
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,256,power_law_1.01,1.3772095680236816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,128,power_law_1.01,0.12295680046081543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,256,power_law_1.2,0.8834303855895996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,256,power_law_1.01,2.9265024185180666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,128,power_law_1.01,0.12910720109939575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,256,power_law_1.2,1.1128640174865723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,128,power_law_1.01,0.07256960272789001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,256,power_law_1.2,1.5564096450805665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,128,power_law_1.01,0.08097919821739197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,256,power_law_1.2,2.521433639526367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,128,power_law_1.01,0.07088639736175537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,128,power_law_1.01,0.0828224003314972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,256,power_law_1.2,5.577664184570312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,128,power_law_1.01,0.0832256019115448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,128,power_law_1.01,0.060083198547363284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,128,power_law_1.01,0.06090239882469177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,128,power_law_1.01,0.06172159910202026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,128,power_law_1.01,0.06520320177078247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,128,power_law_1.01,0.06561279892921448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,128,power_law_1.2,0.11564799547195434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,128,power_law_1.01,0.06848000288009644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,128,power_law_1.2,0.12691199779510498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,128,power_law_1.01,0.06869760155677795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,128,power_law_1.2,0.06362239718437195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,128,power_law_1.01,0.07831680178642272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,128,power_law_1.2,0.07160959839820862
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,128,power_law_1.01,0.08119040131568908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,128,power_law_1.2,0.06833279728889466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,64,power_law_1.01,0.06956160068511963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,128,power_law_1.01,0.08732159733772278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,128,power_law_1.2,0.05848960280418396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,64,power_law_1.01,0.06650239825248719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,128,power_law_1.01,0.10002559423446655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,128,power_law_1.2,0.05850239992141724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,64,power_law_1.01,0.06505600214004517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,128,power_law_1.01,0.11004159450531006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,128,power_law_1.2,0.05850239992141724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,64,power_law_1.01,0.049497601389884946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,128,power_law_1.01,0.12910079956054688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,128,power_law_1.2,0.060140800476074216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,64,power_law_1.01,0.05318400263786316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,128,power_law_1.2,0.061791998147964475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,128,power_law_1.01,0.1463104009628296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,64,power_law_1.01,0.056467199325561525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,128,power_law_1.2,0.06464639902114869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,128,power_law_1.01,0.18031359910964967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,64,power_law_1.01,0.05687040090560913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,128,power_law_1.01,0.21184000968933106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,64,power_law_1.01,0.05727360248565674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,128,power_law_1.01,0.2859839916229248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,64,power_law_1.01,0.058310401439666745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,128,power_law_1.01,0.342905592918396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,64,power_law_1.01,0.05891839861869812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,128,power_law_1.01,0.4891456127166748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,64,power_law_1.01,0.060550397634506224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,128,power_law_1.01,0.5972864151000976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,64,power_law_1.01,0.06343039870262146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,128,power_law_1.01,0.7817855834960937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,64,power_law_1.01,0.06217600107192993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,128,power_law_1.01,1.2350079536437988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,64,power_law_1.01,0.06915839910507202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,64,power_law_1.01,0.07406719923019409
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,128,power_law_1.01,2.3894399642944335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,64,power_law_1.01,0.08000640273094177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,64,power_law_1.01,0.08431360125541687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,64,power_law_1.01,0.09455999732017517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,64,power_law_1.01,0.10724480152130127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,64,power_law_1.01,0.12732800245285034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,64,power_law_1.01,0.14035199880599974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,64,power_law_1.01,0.17790080308914186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,64,power_law_1.01,0.1969599962234497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,64,power_law_1.01,0.2645312070846558
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,64,power_law_1.01,0.337446403503418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,8,power_law_1.01,0.18154239654541016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,64,power_law_1.2,0.1198848009109497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,8,power_law_1.01,0.2577343940734863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,64,power_law_1.01,0.5117184162139893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,64,power_law_1.2,0.06807039976119995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,8,power_law_1.01,0.3789439916610718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,64,power_law_1.01,0.5702976226806641
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,8,power_law_1.01,0.4932544231414795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,64,power_law_1.2,0.07585279941558838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,64,power_law_1.01,0.7142720222473145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,8,power_law_1.01,0.6429440021514893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,64,power_law_1.2,0.07217280268669128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,8,power_law_1.01,1.467289638519287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,64,power_law_1.01,1.0626367568969726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,64,power_law_1.2,0.05496320128440857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,64,power_law_1.2,0.05886719822883606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,64,power_law_1.01,2.119795227050781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,64,power_law_1.2,0.059468799829483034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,64,power_law_1.2,0.0603007972240448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,64,power_law_1.2,0.05947520136833191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,64,power_law_1.2,0.06213759779930115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,64,power_law_1.2,0.06275839805603027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,64,power_law_1.2,0.06520320177078247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,64,power_law_1.2,0.06663680076599121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,64,power_law_1.2,0.07175679802894593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,64,power_law_1.2,0.0815936028957367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,32,power_law_1.01,0.08098559975624084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,64,power_law_1.2,0.08036479949951172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,32,power_law_1.01,0.09287040233612061
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,64,power_law_1.2,0.08609920144081115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,32,power_law_1.2,0.08636800050735474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,32,power_law_1.01,0.0676800012588501
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,64,power_law_1.2,0.10084480047225952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,32,power_law_1.2,0.08021119832992554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,32,power_law_1.01,0.05334399938583374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,64,power_law_1.2,0.11066880226135253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,32,power_law_1.2,0.06033920049667359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,32,power_law_1.01,0.059084802865982056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,64,power_law_1.2,0.13585920333862306
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,32,power_law_1.2,0.04969600141048432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,32,power_law_1.01,0.05743359923362732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,64,power_law_1.2,0.1675968050956726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,32,power_law_1.2,0.05236480236053467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,32,power_law_1.01,0.06173440217971802
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,64,power_law_1.2,0.22616961002349853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,32,power_law_1.2,0.055232000350952146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,32,power_law_1.01,0.0639743983745575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,64,power_law_1.2,0.2319103956222534
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,32,power_law_1.2,0.05748479962348938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,32,power_law_1.01,0.06418560147285461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,64,power_law_1.2,0.31568639278411864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,32,power_law_1.01,0.06540160179138184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,64,power_law_1.2,0.420531177520752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,32,power_law_1.01,0.0676800012588501
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,64,power_law_1.2,0.5890816211700439
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,32,power_law_1.01,0.06970880031585694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,64,power_law_1.2,0.7105152130126953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,32,power_law_1.01,0.06931840181350708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,64,power_law_1.2,0.9308927536010743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,32,power_law_1.01,0.07525759935379028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,32,power_law_1.01,0.08241279721260071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,64,power_law_1.2,1.4537535667419434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,32,power_law_1.01,0.08652160167694092
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,32,power_law_1.01,0.0881600022315979
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,64,power_law_1.2,2.9061887741088865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,32,power_law_1.01,0.09716479778289795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,32,power_law_1.01,0.11191680431365966
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,32,power_law_1.01,0.12208000421524048
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,32,power_law_1.01,0.1530303955078125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,32,power_law_1.01,0.1954751968383789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,32,power_law_1.01,0.22373759746551514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,32,power_law_1.01,0.2911168098449707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,32,power_law_1.01,0.33923840522766113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,32,power_law_1.01,0.4821311950683594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,32,power_law_1.01,0.5866367816925049
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,32,power_law_1.01,0.7208000183105469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,16,power_law_1.01,0.06581760048866273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,32,power_law_1.01,1.06627197265625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,16,power_law_1.01,0.07827839851379395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,16,power_law_1.01,0.05087360143661499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,32,power_law_1.01,2.2471359252929686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,16,power_law_1.01,0.05086719989776611
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,16,power_law_1.01,0.056569600105285646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,16,power_law_1.01,0.060083198547363284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,16,power_law_1.01,0.06234239935874939
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,16,power_law_1.01,0.06516479849815368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,16,power_law_1.01,0.06540799736976624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,16,power_law_1.01,0.06643199920654297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,16,power_law_1.01,0.06705920100212097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,16,power_law_1.01,0.07011839747428894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,16,power_law_1.01,0.06848639845848084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,16,power_law_1.01,0.07585920095443725
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,16,power_law_1.01,0.07871999740600585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,16,power_law_1.2,0.06829439997673034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,16,power_law_1.01,0.08158720135688782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,16,power_law_1.2,0.07505279779434204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,16,power_law_1.01,0.08691840171813965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,16,power_law_1.2,0.05804799795150757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,16,power_law_1.01,0.10124800205230713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,16,power_law_1.2,0.052934402227401735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,16,power_law_1.01,0.10740480422973633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,16,power_law_1.2,0.05743359923362732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,16,power_law_1.01,0.1340224027633667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,16,power_law_1.2,0.0586624026298523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,16,power_law_1.2,0.06357759833335877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,16,power_law_1.01,0.15983359813690184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,16,power_law_1.2,0.06439039707183838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,16,power_law_1.01,0.19178240299224852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,16,power_law_1.2,0.06521599888801574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,16,power_law_1.01,0.21470720767974855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,16,power_law_1.2,0.06604160070419311
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,16,power_law_1.01,0.31322879791259767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,16,power_law_1.2,0.0689087986946106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,16,power_law_1.01,0.38382079601287844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,16,power_law_1.2,0.06972799897193908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,16,power_law_1.01,0.4895616054534912
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,16,power_law_1.2,0.07238399982452393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,16,power_law_1.01,0.6384384155273437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,16,power_law_1.2,0.07444480061531067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,16,power_law_1.01,0.8272383689880372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,16,power_law_1.2,0.08365439772605895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,16,power_law_1.2,0.08508800268173218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,16,power_law_1.01,1.1412351608276368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,16,power_law_1.2,0.09020159840583801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,16,power_law_1.01,2.4234495162963867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,16,power_law_1.2,0.1020799994468689
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,16,power_law_1.2,0.11552000045776367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,16,power_law_1.2,0.144268798828125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,16,power_law_1.2,0.16147840023040771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,16,power_law_1.2,0.2067392110824585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,16,power_law_1.2,0.2577343940734863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,16,power_law_1.2,0.35317120552062986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,16,power_law_1.2,0.4070335865020752
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,16,power_law_1.2,0.6226880073547363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,16,power_law_1.2,0.7133632183074952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,16,power_law_1.2,0.9300864219665528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,16,power_law_1.2,1.460262393951416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,128,power_law_1.2,0.06689919829368592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,16,power_law_1.2,2.8234432220458983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,8,power_law_1.01,0.06479359865188598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,128,power_law_1.2,0.06546559929847717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,8,power_law_1.01,0.06438400149345398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,128,power_law_1.2,0.07119359970092773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,8,power_law_1.01,0.052108800411224364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,128,power_law_1.2,0.07898240089416504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,8,power_law_1.01,0.05372160077095032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,128,power_law_1.2,0.08367999792098998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,8,power_law_1.01,0.05702400207519531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,128,power_law_1.2,0.09208319783210754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,8,power_law_1.01,0.06275200247764587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,128,power_law_1.2,0.10724480152130127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,8,power_law_1.01,0.0664255976676941
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,128,power_law_1.2,0.12197760343551636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,8,power_law_1.01,0.0686847984790802
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,128,power_law_1.2,0.15434880256652833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,8,power_law_1.01,0.07032960057258605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,128,power_law_1.2,0.17482880353927613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,8,power_law_1.01,0.07237759828567505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,128,power_law_1.2,0.2599551916122437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,8,power_law_1.01,0.07524480223655701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,128,power_law_1.2,0.2473344087600708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,8,power_law_1.01,0.07419520020484924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,128,power_law_1.2,0.34767999649047854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,8,power_law_1.2,0.0603007972240448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,8,power_law_1.01,0.07626879811286927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,128,power_law_1.2,0.42897920608520507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,8,power_law_1.2,0.06030719876289368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,8,power_law_1.01,0.07955840229988098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,128,power_law_1.2,0.6450431823730469
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,8,power_law_1.2,0.0531391978263855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,8,power_law_1.01,0.08609920144081115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,128,power_law_1.2,0.8463552474975586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,8,power_law_1.2,0.05518720149993896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,8,power_law_1.01,0.08979200124740601
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,128,power_law_1.2,1.0362112045288085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,8,power_law_1.2,0.05865600109100342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,8,power_law_1.01,0.09839360117912292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,8,power_law_1.2,0.06317440271377564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,128,power_law_1.2,1.6260416030883789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,8,power_law_1.01,0.11148799657821655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,8,power_law_1.2,0.06808320283889771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,8,power_law_1.01,0.12418559789657593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,128,power_law_1.2,4.045126342773438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,8,power_law_1.2,0.06931840181350708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,8,power_law_1.01,0.1487615942955017
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,8,power_law_1.2,0.0689087986946106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,8,power_law_1.01,0.16679680347442627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,8,power_law_1.2,0.07137280106544494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,8,power_law_1.01,0.22779519557952882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,8,power_law_1.2,0.07383679747581481
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,8,power_law_1.01,0.2642816066741943
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,8,power_law_1.2,0.07300480008125305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,8,power_law_1.01,0.35951359272003175
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,8,power_law_1.2,0.07628160119056701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,8,power_law_1.01,0.44695677757263186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,8,power_law_1.2,0.08201599717140198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,8,power_law_1.01,0.6613247871398926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,8,power_law_1.2,0.08876799941062927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,128,power_law_1.01,0.03147520124912262
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,8,power_law_1.01,0.7703231811523438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,8,power_law_1.2,0.09348480105400085
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,128,power_law_1.01,0.03126400113105774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,8,power_law_1.01,0.9394944190979004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,8,power_law_1.2,0.09962239861488342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,128,power_law_1.01,0.0310591995716095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,8,power_law_1.01,1.5796992301940918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,8,power_law_1.2,0.11601279973983765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,128,power_law_1.01,0.03146879971027374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,128,power_law_1.01,0.032492798566818235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,8,power_law_1.2,0.12583680152893068
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,8,power_law_1.01,2.8267135620117188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,128,power_law_1.01,0.033107200264930726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,8,power_law_1.2,0.15779199600219726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,128,power_law_1.01,0.03452799916267395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,8,power_law_1.2,0.1729472041130066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,128,power_law_1.01,0.03678719997406006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,8,power_law_1.2,0.23601920604705812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,128,power_law_1.01,0.04232319891452789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,8,power_law_1.2,0.29541759490966796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,128,power_law_1.01,0.04314239919185638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,8,power_law_1.2,0.38692479133605956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,128,power_law_1.01,0.04762240052223206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,128,power_law_1.01,0.049081599712371825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,8,power_law_1.2,0.5272511959075927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,128,power_law_1.01,0.05195519924163818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,8,power_law_1.2,0.6756991863250732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,128,power_law_1.01,0.04007039964199066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,128,power_law_1.2,0.03162240087985992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,32,power_law_1.2,0.06096640229225159
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,8,power_law_1.2,0.8964672088623047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,128,power_law_1.01,0.04355199933052063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,128,power_law_1.2,0.032025599479675294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,32,power_law_1.2,0.06280320286750793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,8,power_law_1.2,1.0871616363525392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,128,power_law_1.01,0.045388799905776975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,128,power_law_1.2,0.03223679959774017
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,32,power_law_1.2,0.06301440000534057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,128,power_law_1.01,0.046214398741722104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,8,power_law_1.2,1.6800512313842773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,128,power_law_1.2,0.03243519961833954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,32,power_law_1.2,0.06506879925727845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,128,power_law_1.01,0.04989440143108368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,128,power_law_1.2,0.03326080143451691
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,32,power_law_1.2,0.0660863995552063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,8,power_law_1.2,3.2406272888183594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,128,power_law_1.01,0.06053760051727295
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,128,power_law_1.2,0.03326080143451691
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,32,power_law_1.2,0.07017599940299987
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,128,power_law_1.01,0.0660863995552063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,128,power_law_1.2,0.03408640027046204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,128,power_law_1.01,0.08533759713172913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,32,power_law_1.2,0.07029759883880615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,128,power_law_1.2,0.04227840006351471
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,128,power_law_1.01,0.11051520109176635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,128,power_law_1.2,0.043084800243377686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,32,power_law_1.2,0.08002560138702393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,128,power_law_1.2,0.044326400756835936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,128,power_law_1.01,0.1395967960357666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,32,power_law_1.2,0.08204159736633301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,128,power_law_1.2,0.04963839948177338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,128,power_law_1.01,0.18301440477371217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,32,power_law_1.2,0.08635519742965699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,128,power_law_1.2,0.05127040147781372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,128,power_law_1.01,0.19571839570999144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,32,power_law_1.2,0.09824000000953674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,128,power_law_1.2,0.0529151976108551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,128,power_law_1.01,0.2624703884124756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,32,power_law_1.2,0.1082751989364624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,128,power_law_1.2,0.03939839899539947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,64,power_law_1.01,0.03265919983386993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,128,power_law_1.01,0.31529600620269777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,32,power_law_1.2,0.13917440176010132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,128,power_law_1.2,0.04309119880199432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,64,power_law_1.01,0.03163520097732544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,128,power_law_1.01,0.4115839958190918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,32,power_law_1.2,0.1547711968421936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,64,power_law_1.01,0.03163520097732544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,128,power_law_1.2,0.04390400052070618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,32,power_law_1.2,0.19982080459594725
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,128,power_law_1.01,0.6499648094177246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,64,power_law_1.01,0.03245440125465393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,128,power_law_1.2,0.05004799962043762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,32,power_law_1.2,0.21559040546417235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,64,power_law_1.01,0.031839999556541446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,128,power_law_1.2,0.059059202671051025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,128,power_law_1.01,1.2817728042602539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,64,power_law_1.01,0.03200640082359314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,128,power_law_1.2,0.06417919993400574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,32,power_law_1.2,0.2946432113647461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,64,power_law_1.01,0.03327359855175018
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,128,power_law_1.2,0.08855680227279664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,32,power_law_1.2,0.38455679416656496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,64,power_law_1.01,0.03798399865627289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,128,power_law_1.2,0.09797120094299316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,32,power_law_1.2,0.5895423889160156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,64,power_law_1.01,0.042694398760795595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,128,power_law_1.2,0.13114880323410033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,32,power_law_1.2,0.7159103870391845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,64,power_law_1.01,0.043084800243377686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,128,power_law_1.2,0.19750399589538575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,64,power_law_1.01,0.04780800044536591
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,32,power_law_1.2,0.8117504119873047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,128,power_law_1.2,0.276364803314209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,64,power_law_1.01,0.04883840084075928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,128,power_law_1.2,0.2554624080657959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,32,power_law_1.2,1.5592767715454101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,64,power_law_1.01,0.05088000297546387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,128,power_law_1.2,0.38530559539794923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,64,power_law_1.2,0.030847999453544616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,64,power_law_1.01,0.037567999958992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,32,power_law_1.2,2.5845056533813477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,128,power_law_1.2,0.4707071781158447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,64,power_law_1.2,0.0310591995716095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,64,power_law_1.01,0.0416703999042511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,128,power_law_1.2,0.5882495880126953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,64,power_law_1.2,0.030028799176216127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,64,power_law_1.01,0.04104959964752197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,64,power_law_1.2,0.030854400992393494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,64,power_law_1.01,0.04434559941291809
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,128,power_law_1.2,0.8739456176757813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,64,power_law_1.01,0.04842880070209503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,64,power_law_1.2,0.03208959996700287
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,128,power_law_1.2,1.798431968688965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,64,power_law_1.01,0.05477759838104248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,64,power_law_1.2,0.032902398705482484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,64,power_law_1.01,0.060710400342941284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,64,power_law_1.2,0.03310079872608185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,64,power_law_1.01,0.08590720295906067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,64,power_law_1.2,0.03269760012626648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,64,power_law_1.01,0.09511039853096008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,64,power_law_1.2,0.0412992000579834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,64,power_law_1.01,0.11560319662094116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,64,power_law_1.2,0.0427264004945755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,32,power_law_1.01,0.032287999987602234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,64,power_law_1.01,0.1536960005760193
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,64,power_law_1.2,0.049081599712371825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,32,power_law_1.01,0.029420799016952513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,64,power_law_1.01,0.1670016050338745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,64,power_law_1.2,0.05113599896430969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,32,power_law_1.01,0.030649599432945252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,64,power_law_1.2,0.05235199928283692
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,64,power_law_1.01,0.23539841175079346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,32,power_law_1.01,0.030239999294281006
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,64,power_law_1.2,0.04088320136070252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,32,power_law_1.01,0.030649599432945252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,64,power_law_1.01,0.28250880241394044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,32,power_law_1.2,0.03223679959774017
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,64,power_law_1.2,0.04376319944858551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,32,power_law_1.01,0.03227519989013672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,64,power_law_1.01,0.4006847858428955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,32,power_law_1.2,0.029164800047874452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,64,power_law_1.2,0.04456959962844849
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,32,power_law_1.01,0.03332479894161224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,32,power_law_1.2,0.030803200602531434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,64,power_law_1.01,0.5165887832641601
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,64,power_law_1.2,0.04376319944858551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,32,power_law_1.01,0.03290880024433136
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,32,power_law_1.2,0.03080959916114807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,64,power_law_1.01,1.1080639839172364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,64,power_law_1.2,0.05112959742546082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,32,power_law_1.01,0.040275201201438904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,32,power_law_1.2,0.032025599479675294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,32,power_law_1.01,0.04273279905319214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,32,power_law_1.2,0.03345920145511627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,32,power_law_1.01,0.047244799137115476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,32,power_law_1.2,0.03446399867534637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,32,power_law_1.01,0.0490880012512207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,32,power_law_1.2,0.037145599722862244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,32,power_law_1.01,0.051532799005508424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,32,power_law_1.2,0.04227199852466583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,32,power_law_1.01,0.037222400307655334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,32,power_law_1.2,0.043084800243377686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,32,power_law_1.01,0.04069760143756866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,32,power_law_1.2,0.049644801020622256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,32,power_law_1.01,0.04252159893512726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,32,power_law_1.2,0.05087360143661499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,32,power_law_1.01,0.04335359930992126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,32,power_law_1.2,0.052928000688552856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,32,power_law_1.01,0.04785279929637909
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,32,power_law_1.2,0.03653759956359863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,16,power_law_1.01,0.042284798622131345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,32,power_law_1.01,0.05195519924163818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,32,power_law_1.2,0.041247999668121337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,16,power_law_1.01,0.03429119884967804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,32,power_law_1.01,0.06259840130805969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,16,power_law_1.01,0.03203839957714081
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,32,power_law_1.2,0.04288640022277832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,16,power_law_1.01,0.03244799971580505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,32,power_law_1.2,0.046367999911308286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,32,power_law_1.01,0.07285119891166687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,16,power_law_1.01,0.0328575998544693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,32,power_law_1.2,0.05087360143661499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,32,power_law_1.01,0.09406080245971679
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,16,power_law_1.01,0.03449600040912628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,32,power_law_1.2,0.05477759838104248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,32,power_law_1.01,0.11729279756546021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,16,power_law_1.01,0.03490560054779053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,32,power_law_1.2,0.07340800166130065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,32,power_law_1.01,0.1477952003479004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,16,power_law_1.01,0.03531520068645477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,32,power_law_1.2,0.08671360015869141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,32,power_law_1.01,0.17401599884033203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,16,power_law_1.01,0.03532159924507141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,32,power_law_1.2,0.11682560443878173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,32,power_law_1.01,0.24384000301361083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,16,power_law_1.01,0.035519999265670774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,32,power_law_1.2,0.13483519554138185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,32,power_law_1.01,0.30650880336761477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,16,power_law_1.01,0.0359360009431839
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,32,power_law_1.2,0.20078721046447753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,32,power_law_1.01,0.413804817199707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,16,power_law_1.01,0.03818880021572113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,32,power_law_1.2,0.22147200107574463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,32,power_law_1.01,0.6434112071990967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,16,power_law_1.01,0.03818239867687225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,32,power_law_1.2,0.2865920066833496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,16,power_law_1.01,0.03961600065231323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,32,power_law_1.01,1.319871997833252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,32,power_law_1.2,0.42320637702941893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,16,power_law_1.01,0.04391680061817169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,16,power_law_1.01,0.04392319917678833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,32,power_law_1.2,0.7043712139129639
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,16,power_law_1.01,0.04679040014743805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,32,power_law_1.2,1.01977596282959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,16,power_law_1.01,0.052723199129104614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,16,power_law_1.01,0.06195840239524841
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,32,power_law_1.2,2.0710079193115236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,16,power_law_1.01,0.07541760206222534
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,16,power_law_1.01,0.08180480003356934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,16,power_law_1.01,0.10289920568466186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,16,power_law_1.01,0.12338559627532959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,16,power_law_1.01,0.1704767942428589
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,16,power_law_1.2,0.038022398948669434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,16,power_law_1.01,0.20774400234222412
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,16,power_law_1.2,0.030451199412345885
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,16,power_law_1.01,0.27760000228881837
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,16,power_law_1.2,0.030649599432945252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,16,power_law_1.01,0.3777472019195557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,16,power_law_1.2,0.030656000971794127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,16,power_law_1.01,0.4236095905303955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,16,power_law_1.2,0.03188480138778686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,16,power_law_1.01,0.6054656028747558
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,16,power_law_1.2,0.03372159898281098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,8,power_law_1.01,0.0357120007276535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,16,power_law_1.2,0.03433600068092346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,16,power_law_1.01,1.2630911827087403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,8,power_law_1.01,0.030796799063682555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,16,power_law_1.2,0.0341376006603241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,8,power_law_1.01,0.03080959916114807
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,16,power_law_1.2,0.0341376006603241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,8,power_law_1.01,0.031219199299812317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,16,power_law_1.2,0.035359999537467955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,8,power_law_1.01,0.032364800572395325
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,16,power_law_1.2,0.03535360097885132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,8,power_law_1.01,0.034892800450325015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,8,power_law_1.01,0.03550719916820526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,16,power_law_1.2,0.0367935985326767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,8,power_law_1.01,0.03612799942493439
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,16,power_law_1.2,0.03761920034885406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,8,power_law_1.01,0.03653759956359863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,16,power_law_1.2,0.03883520066738129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,8,power_law_1.01,0.03735679984092712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,16,power_law_1.2,0.04376960098743439
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,8,power_law_1.01,0.03776000142097473
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,16,power_law_1.2,0.04417920112609863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,8,power_law_1.01,0.03775359988212586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,16,power_law_1.2,0.04867199957370758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,8,power_law_1.2,0.03612799942493439
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,8,power_law_1.01,0.03938559889793396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,16,power_law_1.2,0.055852800607681274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,8,power_law_1.2,0.03244799971580505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,8,power_law_1.01,0.040633600950241086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,16,power_law_1.2,0.06384000182151794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,8,power_law_1.2,0.03162879943847656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,8,power_law_1.01,0.045132800936698914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,16,power_law_1.2,0.0804095983505249
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,8,power_law_1.2,0.03244799971580505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,8,power_law_1.01,0.04513919949531555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,16,power_law_1.2,0.09619839787483216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,8,power_law_1.2,0.03349120020866394
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,8,power_law_1.01,0.048825600743293764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,16,power_law_1.2,0.12260479927062988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,8,power_law_1.2,0.036748799681663516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,8,power_law_1.01,0.05432959794998169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,8,power_law_1.2,0.036550399661064145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,16,power_law_1.2,0.14514559507369995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,8,power_law_1.01,0.06275200247764587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,8,power_law_1.2,0.036550399661064145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,16,power_law_1.2,0.19367040395736695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,8,power_law_1.01,0.07912319898605347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,8,power_law_1.2,0.036550399661064145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,16,power_law_1.2,0.27681920528411863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,8,power_law_1.2,0.0385919988155365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,8,power_law_1.01,0.08936960101127625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,16,power_law_1.2,0.3265984058380127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,8,power_law_1.2,0.0385919988155365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,8,power_law_1.01,0.1172287940979004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,16,power_law_1.2,0.45026559829711915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,8,power_law_1.2,0.039417600631713866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,8,power_law_1.01,0.1381183981895447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,16,power_law_1.2,0.48551039695739745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,8,power_law_1.2,0.04044159948825836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,8,power_law_1.01,0.2120512008666992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,16,power_law_1.2,0.917843246459961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,8,power_law_1.2,0.04186240136623383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,8,power_law_1.01,0.24440319538116456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,8,power_law_1.2,0.04576640129089356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,8,power_law_1.01,0.32673919200897217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,16,power_law_1.2,1.892697525024414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,8,power_law_1.2,0.048825600743293764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,8,power_law_1.01,0.4172544002532959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,8,power_law_1.2,0.05334399938583374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,8,power_law_1.01,0.5042943954467773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,8,power_law_1.2,0.05989120006561279
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,8,power_law_1.01,0.7342976093292236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,8,power_law_1.2,0.06398720145225525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,8,power_law_1.2,0.08652160167694092
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,8,power_law_1.01,1.7574655532836914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,8,power_law_1.2,0.10044159889221191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,8,power_law_1.2,0.1205183982849121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,8,power_law_1.2,0.15489920377731323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,8,power_law_1.2,0.2141184091567993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,8,power_law_1.2,0.2667455911636353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,8,power_law_1.2,0.3693311929702759
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,32,power_law_1.01,0.054816001653671266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,8,power_law_1.2,0.5247807979583741
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,32,power_law_1.01,0.05237119793891907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,8,power_law_1.2,0.7056128025054932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,32,power_law_1.01,0.05237119793891907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,8,power_law_1.2,0.9820992469787597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,32,power_law_1.01,0.0531711995601654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,32,power_law_1.01,0.05562880039215088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,8,power_law_1.2,2.0079423904418947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,32,power_law_1.2,0.05578879714012146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,32,power_law_1.01,0.05011199712753296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,32,power_law_1.2,0.052934402227401735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,32,power_law_1.01,0.05175039768218994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,32,power_law_1.2,0.05373439788818359
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,32,power_law_1.01,0.05236480236053467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,32,power_law_1.2,0.05292159914970398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,32,power_law_1.01,0.05257599949836731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,32,power_law_1.2,0.05620480179786682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,32,power_law_1.01,0.054016000032424925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,32,power_law_1.2,0.05169919729232788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,32,power_law_1.01,0.05728639960289002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,32,power_law_1.2,0.05251200199127197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,32,power_law_1.01,0.057683199644088745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,32,power_law_1.2,0.05353599786758423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,32,power_law_1.01,0.058508801460266116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,32,power_law_1.2,0.05434880256652832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,32,power_law_1.01,0.06035199761390686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,32,power_law_1.2,0.05620480179786682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,32,power_law_1.01,0.0695680022239685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,32,power_law_1.2,0.057222402095794676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,32,power_law_1.01,0.07243520021438599
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,16,power_law_1.01,0.06686080098152161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,32,power_law_1.2,0.060102397203445436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,32,power_law_1.01,0.07919999957084656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,16,power_law_1.01,0.056428802013397214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,32,power_law_1.2,0.06254720091819763
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,32,power_law_1.01,0.08922880291938781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,16,power_law_1.01,0.04883840084075928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,32,power_law_1.2,0.06479359865188598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,32,power_law_1.01,0.09721599817276001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,16,power_law_1.01,0.050886398553848265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,32,power_law_1.2,0.07114239931106567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,16,power_law_1.01,0.05294719934463501
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,32,power_law_1.01,0.11565439701080323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,32,power_law_1.2,0.07175679802894593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,16,power_law_1.01,0.055795198678970336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,32,power_law_1.01,0.12609280347824098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,16,power_law_1.01,0.057631999254226685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,32,power_law_1.2,0.08117759823799134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,32,power_law_1.01,0.15352959632873536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,16,power_law_1.01,0.057030397653579715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,32,power_law_1.2,0.09552639722824097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,32,power_law_1.01,0.18405120372772216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,16,power_law_1.01,0.058259201049804685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,32,power_law_1.2,0.10739200115203858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,32,power_law_1.01,0.25511679649353025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,16,power_law_1.01,0.05928320288658142
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,32,power_law_1.2,0.1270591974258423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,32,power_law_1.01,0.32556800842285155
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,16,power_law_1.01,0.06255360245704651
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,32,power_law_1.2,0.1425920009613037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,32,power_law_1.01,0.4404607772827148
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,16,power_law_1.01,0.06195840239524841
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,32,power_law_1.2,0.1860416054725647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,32,power_law_1.01,0.5362688064575195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,16,power_law_1.01,0.06540799736976624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,32,power_law_1.2,0.21020159721374512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,32,power_law_1.01,0.717523193359375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,16,power_law_1.01,0.06911360025405884
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,32,power_law_1.2,0.28558080196380614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,32,power_law_1.01,1.0194175720214844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,16,power_law_1.01,0.07525119781494141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,32,power_law_1.2,0.3863359928131104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,16,power_law_1.01,0.07708160281181335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,32,power_law_1.2,0.6161151885986328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,32,power_law_1.01,2.2197568893432615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,16,power_law_1.01,0.08241919875144958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,32,power_law_1.2,0.724832010269165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,16,power_law_1.01,0.09612799882888794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,32,power_law_1.2,0.8219327926635742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,16,power_law_1.01,0.10290559530258178
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,16,power_law_1.01,0.1344256043434143
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,32,power_law_1.2,1.6288639068603517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,64,power_law_1.2,0.058911997079849246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,16,power_law_1.01,0.1356735944747925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,64,power_law_1.2,0.07120000123977661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,32,power_law_1.2,3.3667648315429686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,16,power_law_1.01,0.1741696000099182
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,64,power_law_1.2,0.09002879858016968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,16,power_law_1.01,0.20714879035949707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,64,power_law_1.2,0.11912319660186768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,16,power_law_1.01,0.2736959934234619
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,64,power_law_1.2,0.12814079523086547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,16,power_law_1.01,0.34908161163330076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,64,power_law_1.2,0.2104640007019043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,16,power_law_1.01,0.47029762268066405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,64,power_law_1.2,0.2223423957824707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,64,power_law_1.2,0.35852799415588377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,16,power_law_1.2,0.06280320286750793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,16,power_law_1.01,0.5751616001129151
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,16,power_law_1.2,0.046214398741722104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,64,power_law_1.2,0.537113618850708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,16,power_law_1.01,0.7629631996154785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,16,power_law_1.2,0.04682239890098572
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,64,power_law_1.2,0.6088064193725586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,16,power_law_1.01,1.0046208381652832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,16,power_law_1.2,0.0474368005990982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,64,power_law_1.2,0.8248576164245606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,16,power_law_1.2,0.04990079998970032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,16,power_law_1.01,2.436934471130371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,16,power_law_1.2,0.05235840082168579
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,64,power_law_1.2,1.8328832626342773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,16,power_law_1.2,0.05400320291519165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,16,power_law_1.2,0.05543680191040039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,16,power_law_1.2,0.056460797786712646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,16,power_law_1.2,0.05666559934616089
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,16,power_law_1.2,0.05975040197372437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,16,power_law_1.2,0.06097279787063599
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,16,power_law_1.2,0.06343039870262146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,16,power_law_1.2,0.06424959897994995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,16,power_law_1.2,0.07488639950752259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,16,power_law_1.2,0.07530239820480347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,16,power_law_1.2,0.08227840065956116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,16,power_law_1.2,0.09804159998893738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,128,power_law_1.01,0.14553600549697876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,16,power_law_1.2,0.11134079694747925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,8,power_law_1.2,0.0578495979309082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,128,power_law_1.01,0.1053887963294983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,16,power_law_1.2,0.1375615954399109
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,8,power_law_1.2,0.049644801020622256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,128,power_law_1.01,0.08430079817771911
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,16,power_law_1.2,0.1496448040008545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,8,power_law_1.2,0.05047680139541626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,128,power_law_1.01,0.0775551974773407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,16,power_law_1.2,0.19367680549621583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,8,power_law_1.2,0.05231999754905701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,128,power_law_1.01,0.08246399760246277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,16,power_law_1.2,0.23708798885345458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,8,power_law_1.2,0.05661439895629883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,8,power_law_1.2,0.059487998485565186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,16,power_law_1.2,0.2971776008605957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,128,power_law_1.01,0.06997759938240052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,8,power_law_1.2,0.06092159748077393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,16,power_law_1.2,0.40174078941345215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,128,power_law_1.01,0.07180799841880799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,8,power_law_1.2,0.06235520243644714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,16,power_law_1.2,0.5883264064788818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,128,power_law_1.01,0.07284479737281799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,8,power_law_1.2,0.061740797758102414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,16,power_law_1.2,0.7109888076782227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,128,power_law_1.01,0.0720192015171051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,8,power_law_1.2,0.0629696011543274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,16,power_law_1.2,0.9792639732360839
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,8,power_law_1.2,0.06829439997673034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,128,power_law_1.01,0.07448319792747497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,16,power_law_1.2,1.560921573638916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,8,power_law_1.2,0.07198079824447631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,128,power_law_1.01,0.07672960162162781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,8,power_law_1.2,0.07258880138397217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,128,power_law_1.01,0.07794560194015503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,16,power_law_1.2,3.7090625762939453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,8,power_law_1.2,0.07546240091323853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,128,power_law_1.01,0.07693439722061157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,8,power_law_1.2,0.08262400031089782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,8,power_law_1.2,0.0871295988559723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,128,power_law_1.01,0.08042240142822266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,8,power_law_1.2,0.08980479836463928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,128,power_law_1.01,0.08675839900970458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,8,power_law_1.2,0.10309120416641235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,128,power_law_1.01,0.0847104012966156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,8,power_law_1.2,0.11662720441818238
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,128,power_law_1.01,0.09208959937095643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,8,power_law_1.2,0.14529279470443726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,128,power_law_1.01,0.10027519464492798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,8,power_law_1.2,0.1774399995803833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,8,power_law_1.2,0.20815999507904054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,128,power_law_1.01,0.12035839557647705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,8,power_law_1.2,0.2511807918548584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,128,power_law_1.01,0.1461632013320923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,8,power_law_1.2,0.36586239337921145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,128,power_law_1.2,0.15045759677886963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,128,power_law_1.01,0.15372159481048583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,8,power_law_1.2,0.4490047931671143
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,128,power_law_1.2,0.14369280338287355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,128,power_law_1.01,0.1946943998336792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,8,power_law_1.2,0.647872018814087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,128,power_law_1.2,0.08472319841384887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,128,power_law_1.01,0.2342207908630371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,8,power_law_1.2,0.791648006439209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,128,power_law_1.2,0.09148799777030944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,128,power_law_1.01,0.29750399589538573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,8,power_law_1.2,1.1715328216552734
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,128,power_law_1.2,0.08227199912071229
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,128,power_law_1.01,0.36487679481506347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,8,power_law_1.2,1.5174464225769042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,128,power_law_1.2,0.06874880194664001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,128,power_law_1.01,0.5231808185577392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,128,power_law_1.2,0.0695743978023529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,8,power_law_1.2,2.8402496337890626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,128,power_law_1.01,0.6351871967315674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,128,power_law_1.2,0.07079039812088013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,128,power_law_1.01,0.8101056098937989
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,128,power_law_1.2,0.06588159799575806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,128,power_law_1.01,1.2318016052246095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,128,power_law_1.2,0.0720255970954895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,128,power_law_1.2,0.07857919931411743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,128,power_law_1.01,2.460799980163574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,128,power_law_1.2,0.0818560004234314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,128,power_law_1.2,0.0789247989654541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,128,power_law_1.2,0.07775999903678894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,128,power_law_1.2,0.08329600095748901
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,128,power_law_1.2,0.08636159896850586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,128,power_law_1.2,0.10008319616317748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,64,power_law_1.01,0.11109119653701782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,128,power_law_1.2,0.1121664047241211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,64,power_law_1.01,0.0881600022315979
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,128,power_law_1.2,0.12751359939575196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,64,power_law_1.01,0.07381759881973267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,128,power_law_1.2,0.15987199544906616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,64,power_law_1.01,0.05764480233192444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,128,power_law_1.2,0.16193920373916626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,64,power_law_1.01,0.06213759779930115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,64,power_law_1.2,0.10396159887313842
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,128,power_law_1.2,0.21743359565734863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,64,power_law_1.01,0.06440320014953613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,64,power_law_1.2,0.0859391987323761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,64,power_law_1.01,0.06767359972000123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,128,power_law_1.2,0.26820480823516846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,64,power_law_1.2,0.0732479989528656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,64,power_law_1.01,0.07422080039978027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,128,power_law_1.2,0.34664320945739746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,64,power_law_1.2,0.05624319911003113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,64,power_law_1.01,0.07423359751701356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,64,power_law_1.2,0.06096640229225159
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,128,power_law_1.2,0.43144960403442384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,64,power_law_1.01,0.07134720087051391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,64,power_law_1.2,0.06402559876441956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,128,power_law_1.2,0.6186367988586425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,64,power_law_1.01,0.07710080146789551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,64,power_law_1.2,0.06136959791183472
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,128,power_law_1.2,0.8313983917236328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,64,power_law_1.01,0.07505279779434204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,64,power_law_1.2,0.06792960166931153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,128,power_law_1.2,1.0197695732116698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,64,power_law_1.01,0.07771520018577575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,64,power_law_1.2,0.06709759831428527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,128,power_law_1.2,1.623583984375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,64,power_law_1.01,0.07670400142669678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,64,power_law_1.2,0.06956160068511963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,64,power_law_1.01,0.08835840225219727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,128,power_law_1.2,3.3869182586669924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,64,power_law_1.2,0.07180799841880799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,64,power_law_1.01,0.08979840278625488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,64,power_law_1.2,0.07529600262641907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,64,power_law_1.01,0.09409279823303222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,64,power_law_1.2,0.07734400033950806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,64,power_law_1.01,0.10515199899673462
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,64,power_law_1.2,0.07978879809379577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,64,power_law_1.2,0.08451200127601624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,64,power_law_1.01,0.11068799495697021
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,64,power_law_1.2,0.08677120208740234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,64,power_law_1.01,0.1358847975730896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,64,power_law_1.01,0.15123840570449829
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,64,power_law_1.2,0.09249920248985291
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,64,power_law_1.2,0.1072383999824524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,64,power_law_1.01,0.19545600414276124
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,64,power_law_1.2,0.12157440185546875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,64,power_law_1.01,0.21800320148468016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,64,power_law_1.2,0.1469696044921875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,64,power_law_1.01,0.3027776002883911
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,32,power_law_1.01,0.08554239869117737
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,64,power_law_1.2,0.15474560260772705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,64,power_law_1.01,0.36482560634613037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,32,power_law_1.01,0.09218559861183166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,64,power_law_1.2,0.1989824056625366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,64,power_law_1.01,0.5100351810455322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,32,power_law_1.01,0.07277439832687378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,64,power_law_1.2,0.23626880645751952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,32,power_law_1.01,0.05440639853477478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,64,power_law_1.01,0.6308671951293945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,64,power_law_1.2,0.3241152048110962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,32,power_law_1.01,0.061375999450683595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,64,power_law_1.01,0.7887807846069336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,64,power_law_1.2,0.4283711910247803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,32,power_law_1.01,0.06465280055999756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,64,power_law_1.01,1.178502368927002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,32,power_law_1.01,0.06403840184211732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,64,power_law_1.2,0.6083648204803467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,64,power_law_1.01,2.3878400802612303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,32,power_law_1.01,0.0689791977405548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,64,power_law_1.2,0.6954175949096679
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,32,power_law_1.01,0.07037439942359924
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,64,power_law_1.2,0.8891584396362304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,32,power_law_1.01,0.06935039758682252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,64,power_law_1.2,1.4386431694030761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,32,power_law_1.01,0.07120000123977661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,64,power_law_1.2,2.7276607513427735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,32,power_law_1.01,0.07939199805259704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,32,power_law_1.01,0.07858560085296631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,32,power_law_1.01,0.07886719703674316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,32,power_law_1.01,0.0904640018939972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,32,power_law_1.01,0.08922240138053894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,32,power_law_1.01,0.09230080246925354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,32,power_law_1.2,0.08077440261840821
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,32,power_law_1.01,0.10293760299682617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,32,power_law_1.2,0.09758080244064331
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,32,power_law_1.01,0.11461759805679321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,32,power_law_1.2,0.0791487991809845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,32,power_law_1.01,0.13834240436553955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,32,power_law_1.2,0.057030397653579715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,32,power_law_1.01,0.1584447979927063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,32,power_law_1.2,0.0590719997882843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,32,power_law_1.01,0.19612159729003906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,32,power_law_1.2,0.0629696011543274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,16,power_law_1.01,0.06382079720497132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,32,power_law_1.01,0.22439041137695312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,32,power_law_1.2,0.06604160070419311
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,8,power_law_1.01,0.056601601839065555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,16,power_law_1.01,0.07979519963264466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,32,power_law_1.01,0.30076799392700193
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,8,power_law_1.01,0.060915201902389526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,32,power_law_1.2,0.07011839747428894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,16,power_law_1.01,0.08165119886398316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,8,power_law_1.01,0.04963200092315674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,32,power_law_1.01,0.3767616033554077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,32,power_law_1.2,0.0701312005519867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,16,power_law_1.01,0.05685120224952698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,8,power_law_1.01,0.05046399831771851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,32,power_law_1.2,0.07176960110664368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,32,power_law_1.01,0.5465280055999756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,16,power_law_1.01,0.057683199644088745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,8,power_law_1.01,0.052102398872375486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,32,power_law_1.2,0.07465599775314331
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,16,power_law_1.01,0.06670079827308655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,32,power_law_1.01,0.6614272117614746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,8,power_law_1.01,0.057222402095794676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,32,power_law_1.2,0.077920001745224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,16,power_law_1.01,0.06628479957580566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,8,power_law_1.01,0.0590719997882843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,32,power_law_1.01,0.804377555847168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,32,power_law_1.2,0.07791360020637512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,16,power_law_1.01,0.06956160068511963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,8,power_law_1.01,0.059680002927780154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,32,power_law_1.01,1.2346559524536134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,32,power_law_1.2,0.08076800107955932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,8,power_law_1.01,0.061318397521972656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,16,power_law_1.01,0.07243520021438599
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,8,power_law_1.01,0.063372802734375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,32,power_law_1.2,0.08937600255012512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,32,power_law_1.01,2.5640256881713865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,16,power_law_1.01,0.07263360023498536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,8,power_law_1.01,0.06643199920654297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,32,power_law_1.2,0.09102720022201538
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,16,power_law_1.01,0.0773311972618103
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,8,power_law_1.01,0.06727039813995361
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,32,power_law_1.2,0.09798399806022644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,16,power_law_1.01,0.0773311972618103
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,8,power_law_1.01,0.07052800059318542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,32,power_law_1.2,0.10883840322494506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,16,power_law_1.01,0.08184319734573364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,8,power_law_1.01,0.07422080039978027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,32,power_law_1.2,0.11724159717559815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,16,power_law_1.01,0.08223999738693237
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,8,power_law_1.01,0.07914239764213563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,32,power_law_1.2,0.14672640562057496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,8,power_law_1.01,0.08405759930610657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,16,power_law_1.01,0.09042559862136841
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,8,power_law_1.01,0.0863103985786438
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,32,power_law_1.2,0.1676095962524414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,16,power_law_1.01,0.09242240190505982
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,8,power_law_1.01,0.10249600410461426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,32,power_law_1.2,0.21185920238494874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,16,power_law_1.01,0.09699199795722961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,8,power_law_1.01,0.12091519832611083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,32,power_law_1.2,0.23233919143676757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,16,power_law_1.01,0.10868480205535888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,8,power_law_1.01,0.143449604511261
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,16,power_law_1.01,0.11646080017089844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,32,power_law_1.2,0.32695679664611815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,8,power_law_1.01,0.1573632001876831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,16,power_law_1.2,0.06341760158538819
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,16,power_law_1.01,0.1434816002845764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,32,power_law_1.2,0.415008020401001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,8,power_law_1.01,0.20140159130096436
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,16,power_law_1.2,0.07694079875946044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,16,power_law_1.01,0.1695039987564087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,32,power_law_1.2,0.5895103931427002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,8,power_law_1.01,0.24174718856811522
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,16,power_law_1.2,0.05891839861869812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,16,power_law_1.01,0.20758399963378907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,8,power_law_1.01,0.3224384069442749
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,32,power_law_1.2,0.7039807796478271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,16,power_law_1.2,0.05236480236053467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,16,power_law_1.01,0.26248960494995116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,8,power_law_1.01,0.39084160327911377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,16,power_law_1.2,0.05912960171699524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,32,power_law_1.2,0.9157504081726074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,8,power_law_1.01,0.5690176010131835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,16,power_law_1.01,0.3308864116668701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,16,power_law_1.2,0.061375999450683595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,32,power_law_1.2,1.4721983909606933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,8,power_law_1.01,0.773203182220459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,16,power_law_1.01,0.41484799385070803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,16,power_law_1.2,0.06382719874382019
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,32,power_law_1.2,3.023859214782715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,8,power_law_1.01,0.828486442565918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,16,power_law_1.01,0.5719423770904541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,16,power_law_1.2,0.07324159741401673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,8,power_law_1.01,1.309171199798584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,16,power_law_1.2,0.07319039702415467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,16,power_law_1.01,0.7203519821166993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,16,power_law_1.2,0.07407360076904297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,16,power_law_1.01,0.9100607872009278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,8,power_law_1.01,2.8722047805786133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,16,power_law_1.2,0.07570559978485107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,16,power_law_1.01,1.3496959686279297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,16,power_law_1.2,0.0794048011302948
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,16,power_law_1.01,2.7292863845825197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,16,power_law_1.2,0.07817599773406983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,16,power_law_1.2,0.0830784022808075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,16,power_law_1.2,0.09004799723625183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,16,power_law_1.2,0.09290879964828491
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,16,power_law_1.2,0.09864959716796876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,16,power_law_1.2,0.11278719902038574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,8,power_law_1.01,0.030643200874328612
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,16,power_law_1.2,0.12117760181427002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,8,power_law_1.01,0.033107200264930726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,8,power_law_1.01,0.06684160232543945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,8,power_law_1.01,0.03146879971027374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,16,power_law_1.2,0.15230720043182372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,8,power_law_1.01,0.03043839931488037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,8,power_law_1.01,0.06645119786262513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,16,power_law_1.2,0.17605119943618774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,8,power_law_1.01,0.0310591995716095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,8,power_law_1.01,0.07300480008125305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,16,power_law_1.2,0.21414399147033691
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,8,power_law_1.01,0.03208320140838623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,8,power_law_1.2,0.05906559824943543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,8,power_law_1.01,0.033107200264930726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,8,power_law_1.01,0.05457280278205871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,16,power_law_1.2,0.26617600917816164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,8,power_law_1.2,0.06561920046806335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,8,power_law_1.01,0.03351039886474609
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,8,power_law_1.01,0.06152960062026978
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,8,power_law_1.01,0.03454079926013946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,16,power_law_1.2,0.35177600383758545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,8,power_law_1.2,0.05803520083427429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,8,power_law_1.01,0.0689087986946106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,8,power_law_1.01,0.03433600068092346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,16,power_law_1.2,0.4457791805267334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,8,power_law_1.2,0.05600000023841858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,8,power_law_1.01,0.035769599676132205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,8,power_law_1.01,0.0705344021320343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,8,power_law_1.01,0.03699840009212494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,16,power_law_1.2,0.6030655860900879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,8,power_law_1.2,0.060288000106811526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,8,power_law_1.01,0.07460479736328125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,8,power_law_1.01,0.03760640025138855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,16,power_law_1.2,0.825267219543457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,8,power_law_1.01,0.0367680013179779
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,8,power_law_1.2,0.06377599835395813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,8,power_law_1.01,0.07668480277061462
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,8,power_law_1.01,0.0412992000579834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,8,power_law_1.01,0.07912960052490234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,8,power_law_1.2,0.06807680130004883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,16,power_law_1.2,1.0419455528259278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,8,power_law_1.01,0.04190079867839813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,8,power_law_1.01,0.04394879937171936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,8,power_law_1.01,0.08468480110168457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,8,power_law_1.2,0.07299839854240417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,16,power_law_1.2,1.4656831741333007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,8,power_law_1.01,0.05092480182647705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,8,power_law_1.01,0.08488320112228394
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,8,power_law_1.2,0.07729920148849487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,8,power_law_1.01,0.05728639960289002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,16,power_law_1.2,2.9472063064575194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,8,power_law_1.01,0.08549759984016418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,8,power_law_1.01,0.06955519914627076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,8,power_law_1.2,0.07912960052490234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,8,power_law_1.01,0.07528960108757018
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,8,power_law_1.01,0.09082239866256714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,8,power_law_1.2,0.08363519906997681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,8,power_law_1.01,0.10560640096664428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,8,power_law_1.01,0.09634559750556945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,8,power_law_1.01,0.1240447998046875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,8,power_law_1.2,0.08609279990196228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,8,power_law_1.01,0.17441920042037964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,8,power_law_1.01,0.10001280307769775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,8,power_law_1.2,0.08733440041542054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,8,power_law_1.01,0.21782400608062744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,8,power_law_1.01,0.10617599487304688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,8,power_law_1.01,0.3097791910171509
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,8,power_law_1.2,0.09059839844703674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,8,power_law_1.2,0.03351039886474609
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,8,power_law_1.01,0.3968192100524902
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,8,power_law_1.01,0.12296960353851319
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,8,power_law_1.2,0.03187839984893799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,8,power_law_1.2,0.09715840220451355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,8,power_law_1.01,0.5039360046386718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,8,power_law_1.2,0.03043839931488037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,8,power_law_1.01,0.1340288043022156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,8,power_law_1.2,0.10044159889221191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,8,power_law_1.01,0.8150272369384766
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,8,power_law_1.2,0.03146879971027374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,8,power_law_1.01,0.1618880033493042
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,8,power_law_1.2,0.0310591995716095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,8,power_law_1.2,0.11025919914245605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,8,power_law_1.01,1.5854911804199219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,8,power_law_1.01,0.18851200342178345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,8,power_law_1.2,0.033523198962211606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,8,power_law_1.2,0.12132480144500732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,8,power_law_1.2,0.03495680093765259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,8,power_law_1.01,0.24092159271240235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,8,power_law_1.2,0.1381183981895447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,8,power_law_1.01,0.289247989654541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,8,power_law_1.2,0.1717120051383972
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,8,power_law_1.01,0.4170688152313232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,8,power_law_1.2,0.20079360008239747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,8,power_law_1.01,0.506771183013916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,8,power_law_1.2,0.25525119304656985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,8,power_law_1.01,0.7023551940917969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,8,power_law_1.01,0.034329599142074584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,8,power_law_1.2,0.30892798900604246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,8,power_law_1.01,0.03351680040359497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,8,power_law_1.01,0.9054976463317871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,8,power_law_1.01,0.034745600819587705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,8,power_law_1.2,0.4232192039489746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,8,power_law_1.01,0.03351680040359497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,8,power_law_1.01,1.0928832054138184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,8,power_law_1.01,0.03473280072212219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,8,power_law_1.2,0.5407551765441895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,8,power_law_1.01,1.664896011352539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,8,power_law_1.01,0.035155200958251955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,8,power_law_1.2,0.7334720134735108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,8,power_law_1.01,0.0367680013179779
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,8,power_law_1.01,0.0367935985326767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,8,power_law_1.01,3.1714048385620117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,8,power_law_1.2,0.9554688453674316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,8,power_law_1.01,0.03781760036945343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,8,power_law_1.01,0.037625598907470706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,8,power_law_1.2,1.1227840423583983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,8,power_law_1.01,0.037196800112724304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,8,power_law_1.01,0.03780480027198792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,8,power_law_1.2,1.7230592727661134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,8,power_law_1.01,0.03883520066738129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,8,power_law_1.01,0.04252159893512726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,8,power_law_1.2,3.6623104095458983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,8,power_law_1.01,0.048588800430297854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,8,power_law_1.01,0.05356799960136414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,8,power_law_1.2,0.0361407995223999
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,8,power_law_1.01,0.050310397148132326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,8,power_law_1.2,0.03736959993839264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,8,power_law_1.01,0.059308797121047974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,8,power_law_1.2,0.03552640080451965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,8,power_law_1.01,0.0646399974822998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,8,power_law_1.2,0.035308799147605895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,8,power_law_1.01,0.084307199716568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,8,power_law_1.2,0.03552640080451965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,8,power_law_1.01,0.11113599538803101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,8,power_law_1.2,0.03695360124111176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,8,power_law_1.01,0.14902399778366088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,8,power_law_1.2,0.03777920007705689
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,256,power_law_1.01,0.0852735996246338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,8,power_law_1.01,0.1725759983062744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,8,power_law_1.2,0.03736959993839264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,8,power_law_1.01,0.23953280448913575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,8,power_law_1.2,0.037363201379776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,256,power_law_1.01,0.06910719871520996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,8,power_law_1.2,0.03736959993839264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,8,power_law_1.01,0.2983167886734009
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,256,power_law_1.01,0.05537279844284058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,8,power_law_1.2,0.03941119909286499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,8,power_law_1.01,0.42714881896972656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,256,power_law_1.01,0.05681920051574707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,8,power_law_1.2,0.03941119909286499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,8,power_law_1.01,0.5313727855682373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,8,power_law_1.2,0.04085119962692261
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,8,power_law_1.01,0.6757760047912598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,256,power_law_1.01,0.053324800729751584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,8,power_law_1.2,0.04310399889945984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,8,power_law_1.01,1.076972770690918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,256,power_law_1.01,0.05496320128440857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,8,power_law_1.2,0.05170559883117676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,8,power_law_1.01,2.117363166809082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,8,power_law_1.2,0.05457280278205871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,256,power_law_1.01,0.05578879714012146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,8,power_law_1.2,0.05026559829711914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,256,power_law_1.01,0.05618559718132019
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,8,power_law_1.2,0.060096001625061034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,256,power_law_1.01,0.057811200618743896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,8,power_law_1.2,0.06808320283889771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,8,power_law_1.2,0.08570240139961242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,256,power_law_1.01,0.05783680081367493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,8,power_law_1.2,0.10515199899673462
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,256,power_law_1.01,0.059680002927780154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,8,power_law_1.2,0.14179840087890624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,8,power_law_1.2,0.1753983974456787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,256,power_law_1.01,0.061926400661468504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,8,power_law_1.2,0.24318718910217285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,256,power_law_1.01,0.0615231990814209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,256,power_law_1.2,0.07100160121917724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,8,power_law_1.2,0.3015615940093994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,256,power_law_1.01,0.06418560147285461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,256,power_law_1.2,0.0818560004234314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,8,power_law_1.2,0.4395711898803711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,8,power_law_1.2,0.5297215938568115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,256,power_law_1.01,0.06725119948387145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,256,power_law_1.2,0.05583999752998352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,8,power_law_1.2,0.7011072158813476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,256,power_law_1.01,0.07216640114784241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,256,power_law_1.2,0.05440639853477478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,8,power_law_1.2,1.0353471755981445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,256,power_law_1.01,0.07791360020637512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,256,power_law_1.2,0.054604798555374146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,8,power_law_1.2,2.0411136627197264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,256,power_law_1.01,0.09388800263404846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,256,power_law_1.2,0.05514240264892578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,256,power_law_1.2,0.05604479908943176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,256,power_law_1.01,0.1045375943183899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,256,power_law_1.2,0.05480960011482239
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,256,power_law_1.01,0.12992000579833984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,256,power_law_1.2,0.056460797786712646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,256,power_law_1.01,0.15408639907836913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,256,power_law_1.2,0.057683199644088745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,256,power_law_1.01,0.20447359085083008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,256,power_law_1.2,0.060140800476074216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,256,power_law_1.01,0.2536191940307617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,128,power_law_1.01,0.05907840132713318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,256,power_law_1.2,0.05971840023994446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,256,power_law_1.01,0.33615999221801757
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,128,power_law_1.01,0.05846400260925293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,256,power_law_1.2,0.061977601051330565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,256,power_law_1.01,0.41889281272888185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,128,power_law_1.01,0.05455999970436096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,256,power_law_1.2,0.06156799793243408
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,256,power_law_1.01,0.5985023975372314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,128,power_law_1.01,0.05457280278205871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,256,power_law_1.2,0.070169597864151
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,256,power_law_1.01,0.764185619354248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,128,power_law_1.01,0.05886719822883606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,256,power_law_1.2,0.07181439995765686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,128,power_law_1.01,0.05702400207519531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,256,power_law_1.01,0.9435903549194335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,256,power_law_1.2,0.0834879994392395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,128,power_law_1.01,0.0586624026298523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,256,power_law_1.2,0.10192639827728271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,256,power_law_1.01,1.534233570098877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,128,power_law_1.01,0.05682560205459595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,256,power_law_1.2,0.11216000318527222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,128,power_law_1.01,0.0574400007724762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,256,power_law_1.01,3.0581439971923827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,256,power_law_1.2,0.14247039556503296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,128,power_law_1.01,0.0597055971622467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,256,power_law_1.2,0.167468798160553
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,128,power_law_1.01,0.06378239989280701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,256,power_law_1.2,0.23586559295654297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,128,power_law_1.01,0.061945599317550656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,256,power_law_1.2,0.2948415994644165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,128,power_law_1.01,0.06480640172958374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,256,power_law_1.2,0.42098560333251955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,128,power_law_1.01,0.06561279892921448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,256,power_law_1.2,0.5248191833496094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,128,power_law_1.01,0.07258880138397217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,256,power_law_1.2,0.7658751964569092
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,128,power_law_1.2,0.059059202671051025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,128,power_law_1.01,0.07585920095443725
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,128,power_law_1.2,0.05742719769477844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,256,power_law_1.2,1.0157247543334962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,128,power_law_1.01,0.0807807981967926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,128,power_law_1.2,0.05497599840164184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,256,power_law_1.2,1.2698944091796875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,128,power_law_1.01,0.09552639722824097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,128,power_law_1.2,0.055379199981689456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,128,power_law_1.01,0.10515199899673462
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,256,power_law_1.2,2.2455488204956056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,128,power_law_1.2,0.059468799829483034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,128,power_law_1.01,0.13383040428161622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,256,power_law_1.2,4.505311965942383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,128,power_law_1.2,0.05619199872016907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,128,power_law_1.01,0.15327999591827393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,128,power_law_1.01,0.19916160106658937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,128,power_law_1.2,0.05619840025901794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,128,power_law_1.01,0.24481918811798095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,128,power_law_1.2,0.05702400207519531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,128,power_law_1.2,0.05822719931602478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,128,power_law_1.01,0.32940800189971925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,128,power_law_1.2,0.05948160290718078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,128,power_law_1.01,0.4104959964752197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,128,power_law_1.2,0.06234239935874939
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,128,power_law_1.01,0.5804863929748535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,128,power_law_1.2,0.06212480068206787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,128,power_law_1.01,0.7613183975219726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,64,power_law_1.01,0.06750079989433289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,128,power_law_1.2,0.06418560147285461
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,64,power_law_1.01,0.05973759889602661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,128,power_law_1.01,0.9640895843505859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,128,power_law_1.2,0.06480000019073487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,64,power_law_1.01,0.05829120278358459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,128,power_law_1.01,1.5018815994262695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,128,power_law_1.2,0.07094399929046631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,64,power_law_1.01,0.055219197273254396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,128,power_law_1.01,3.0077823638916015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,128,power_law_1.2,0.0738048017024994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,64,power_law_1.01,0.05686399936676025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,128,power_law_1.2,0.08158079981803894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,64,power_law_1.01,0.05482879877090454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,64,power_law_1.01,0.055225598812103274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,128,power_law_1.2,0.0967423975467682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,64,power_law_1.01,0.05726720094680786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,128,power_law_1.2,0.1082111954689026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,64,power_law_1.01,0.058911997079849246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,128,power_law_1.2,0.13600000143051147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,64,power_law_1.01,0.05973759889602661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,128,power_law_1.2,0.15900800228118897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,64,power_law_1.01,0.061363202333450315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,128,power_law_1.2,0.20856959819793702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,64,power_law_1.2,0.06870399713516236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,64,power_law_1.01,0.0630079984664917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,128,power_law_1.2,0.2652992010116577
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,64,power_law_1.2,0.0615231990814209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,64,power_law_1.01,0.06341760158538819
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,64,power_law_1.2,0.053337597846984865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,128,power_law_1.2,0.3738431930541992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,64,power_law_1.01,0.06874880194664001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,64,power_law_1.2,0.05621119737625122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,128,power_law_1.2,0.4592448234558105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,64,power_law_1.01,0.07221119999885559
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,64,power_law_1.2,0.05539199709892273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,128,power_law_1.2,0.6646527767181396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,64,power_law_1.01,0.07487360239028931
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,64,power_law_1.2,0.05539199709892273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,128,power_law_1.2,0.8927935600280762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,64,power_law_1.01,0.07878400087356567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,64,power_law_1.2,0.05682560205459595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,128,power_law_1.2,1.1563520431518555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,64,power_law_1.01,0.09086719751358033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,64,power_law_1.2,0.058259201049804685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,64,power_law_1.01,0.10273920297622681
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,64,power_law_1.2,0.059487998485565186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,128,power_law_1.2,1.766886329650879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,64,power_law_1.01,0.13366400003433226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,64,power_law_1.2,0.06071680188179016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,128,power_law_1.2,3.8113983154296873
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,64,power_law_1.2,0.063372802734375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,64,power_law_1.01,0.15004160404205322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,64,power_law_1.2,0.06480640172958374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,64,power_law_1.01,0.1949056029319763
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,64,power_law_1.2,0.06647040247917176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,64,power_law_1.01,0.24282240867614746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,64,power_law_1.2,0.06849920153617858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,64,power_law_1.01,0.33374719619750975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,64,power_law_1.2,0.07381759881973267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,64,power_law_1.01,0.4181312084197998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,64,power_law_1.2,0.0785215973854065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,8,power_law_1.2,0.0343423992395401
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,64,power_law_1.01,0.5805376052856446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,8,power_law_1.2,0.03372800052165985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,64,power_law_1.2,0.08241919875144958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,64,power_law_1.01,0.7486720085144043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,8,power_law_1.2,0.03392640054225922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,32,power_law_1.01,0.06439039707183838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,64,power_law_1.2,0.09736319780349731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,8,power_law_1.2,0.035359999537467955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,64,power_law_1.01,0.8965439796447754
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,32,power_law_1.01,0.06151679754257202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,64,power_law_1.2,0.11396479606628418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,8,power_law_1.2,0.0355648010969162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,64,power_law_1.01,1.4193856239318847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,32,power_law_1.01,0.05496960282325745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,64,power_law_1.2,0.14097919464111328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,8,power_law_1.2,0.03617919981479645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,8,power_law_1.2,0.036601600050926206
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,32,power_law_1.01,0.05333120226860046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,64,power_law_1.2,0.16289279460906983
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,64,power_law_1.01,2.697932815551758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,8,power_law_1.2,0.04128639996051788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,32,power_law_1.01,0.05475839972496033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,64,power_law_1.2,0.21472640037536622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,8,power_law_1.2,0.041503998637199405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,8,power_law_1.2,0.04478079974651337
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,32,power_law_1.01,0.057625597715377806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,64,power_law_1.2,0.27307519912719724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,8,power_law_1.2,0.05194240212440491
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,64,power_law_1.2,0.36728320121765134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,32,power_law_1.01,0.059059202671051025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,8,power_law_1.2,0.056460797786712646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,32,power_law_1.01,0.060703998804092406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,64,power_law_1.2,0.42810878753662107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,8,power_law_1.2,0.06649600267410279
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,8,power_law_1.2,0.07488639950752259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,32,power_law_1.01,0.06193280220031738
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,64,power_law_1.2,0.6552320003509522
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,8,power_law_1.2,0.10766079425811767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,32,power_law_1.01,0.06273919939994813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,64,power_law_1.2,0.8706879615783691
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,8,power_law_1.2,0.1256832003593445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,32,power_law_1.2,0.06443520188331604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,32,power_law_1.01,0.06356480121612548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,8,power_law_1.2,0.17441279888153077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,64,power_law_1.2,1.149836826324463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,32,power_law_1.2,0.06547200083732604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,32,power_law_1.01,0.06602879762649536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,8,power_law_1.2,0.22030720710754395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,32,power_law_1.2,0.048870399594306946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,64,power_law_1.2,1.721843147277832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,8,power_law_1.2,0.3202431917190552
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,32,power_law_1.01,0.06786559820175171
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,32,power_law_1.2,0.05132799744606018
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,8,power_law_1.2,0.4210048198699951
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,64,power_law_1.2,3.395872116088867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,32,power_law_1.01,0.07299200296401978
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,32,power_law_1.2,0.05316479802131653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,8,power_law_1.2,0.5186816215515136
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,32,power_law_1.01,0.0758463978767395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,8,power_law_1.2,0.7966015815734864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,32,power_law_1.2,0.057068800926208495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,32,power_law_1.01,0.08015999794006348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,8,power_law_1.2,1.586297607421875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,32,power_law_1.2,0.05727360248565674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,32,power_law_1.01,0.0801472008228302
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,32,power_law_1.2,0.05911039710044861
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,32,power_law_1.01,0.09571200013160705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,32,power_law_1.2,0.06096000075340271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,32,power_law_1.01,0.10903040170669556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,32,power_law_1.2,0.061791998147964475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,32,power_law_1.2,0.06464639902114869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,32,power_law_1.01,0.13647359609603882
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,16,power_law_1.01,0.06480000019073487
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,32,power_law_1.2,0.06648319959640503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,32,power_law_1.01,0.15430400371551514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,16,power_law_1.01,0.06951680183410644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,32,power_law_1.2,0.06873599886894226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,32,power_law_1.01,0.20079360008239747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,32,power_law_1.2,0.0720192015171051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,16,power_law_1.01,0.056415998935699464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,32,power_law_1.01,0.24381439685821532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,16,power_law_1.2,0.0695680022239685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,32,power_law_1.2,0.07816960215568543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,16,power_law_1.01,0.05497599840164184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,16,power_law_1.2,0.06792960166931153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,32,power_law_1.01,0.32447359561920164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,16,power_law_1.01,0.05661439895629883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,32,power_law_1.2,0.08205440044403076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,16,power_law_1.2,0.05092480182647705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,32,power_law_1.01,0.4195136070251465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,16,power_law_1.01,0.0602944016456604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,32,power_law_1.2,0.08635519742965699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,16,power_law_1.2,0.05318400263786316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,32,power_law_1.01,0.6066944122314453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,16,power_law_1.01,0.06295679807662964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,32,power_law_1.2,0.09781119823455811
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,16,power_law_1.2,0.05563520193099976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,32,power_law_1.01,0.7482111930847168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,16,power_law_1.01,0.06335999965667724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,32,power_law_1.2,0.10970239639282227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,16,power_law_1.2,0.058297598361968996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,32,power_law_1.01,0.9251584053039551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,16,power_law_1.01,0.06522240042686463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,32,power_law_1.2,0.139193594455719
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,16,power_law_1.2,0.0617792010307312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,16,power_law_1.01,0.06808320283889771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,32,power_law_1.01,1.499833583831787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,32,power_law_1.2,0.15987839698791503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,16,power_law_1.2,0.06362239718437195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,16,power_law_1.01,0.0686784029006958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,32,power_law_1.2,0.20840959548950194
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,16,power_law_1.2,0.06280320286750793
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,32,power_law_1.01,2.873414421081543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,16,power_law_1.01,0.07218559980392455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,16,power_law_1.2,0.06423680186271667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,32,power_law_1.2,0.24732160568237305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,16,power_law_1.01,0.07300480008125305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,16,power_law_1.2,0.06895359754562377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,32,power_law_1.2,0.350547194480896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,16,power_law_1.01,0.07669119834899903
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,16,power_law_1.2,0.07038080096244811
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,32,power_law_1.2,0.4613183975219727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,16,power_law_1.01,0.07975680232048035
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,16,power_law_1.2,0.07426559925079346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,32,power_law_1.2,0.6405375957489013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,16,power_law_1.01,0.08487679958343505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,16,power_law_1.2,0.07571200132369996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,32,power_law_1.2,0.8523072242736817
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,16,power_law_1.01,0.08876799941062927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,16,power_law_1.2,0.08452479839324951
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,32,power_law_1.2,1.0316991806030273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,16,power_law_1.01,0.10495359897613525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,16,power_law_1.2,0.08841599822044373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,32,power_law_1.2,1.574028778076172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,16,power_law_1.01,0.11722240447998047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,16,power_law_1.2,0.0933247983455658
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,16,power_law_1.01,0.14589439630508422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,8,power_law_1.01,0.06909440159797668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,16,power_law_1.2,0.110534405708313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,32,power_law_1.2,3.1220991134643556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,16,power_law_1.01,0.17006080150604247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,8,power_law_1.01,0.07033600211143494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,16,power_law_1.2,0.11994880437850952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,16,power_law_1.01,0.217574405670166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,8,power_law_1.01,0.05619840025901794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,16,power_law_1.2,0.15211520195007325
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,16,power_law_1.01,0.2689663887023926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,8,power_law_1.01,0.05783680081367493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,16,power_law_1.2,0.17482880353927613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,16,power_law_1.01,0.3707648038864136
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,8,power_law_1.01,0.06296319961547851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,16,power_law_1.2,0.21989760398864747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,16,power_law_1.01,0.45024638175964354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,16,power_law_1.2,0.2833856105804443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,8,power_law_1.01,0.06561920046806335
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,16,power_law_1.01,0.6466303825378418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,8,power_law_1.01,0.07134720087051391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,16,power_law_1.2,0.3767551898956299
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,8,power_law_1.01,0.07420799732208253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,16,power_law_1.2,0.4953472137451172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,16,power_law_1.01,0.8415488243103028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,8,power_law_1.01,0.07423359751701356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,16,power_law_1.2,0.6946112155914307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,16,power_law_1.01,1.0009407997131348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,8,power_law_1.2,0.06648319959640503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,8,power_law_1.01,0.07584000229835511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,16,power_law_1.2,0.8973631858825684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,16,power_law_1.01,1.5649279594421386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,8,power_law_1.2,0.06914560198783874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,8,power_law_1.01,0.07913600206375122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,16,power_law_1.2,1.0526016235351563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,8,power_law_1.2,0.05317760109901428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,16,power_law_1.01,3.0102272033691406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,8,power_law_1.01,0.08732159733772278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,8,power_law_1.2,0.056454402208328244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,16,power_law_1.2,1.8132352828979492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,8,power_law_1.01,0.08691200017929077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,8,power_law_1.2,0.05971840023994446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,8,power_law_1.01,0.08424959778785705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,16,power_law_1.2,3.397971343994141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,8,power_law_1.2,0.06416640281677247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,8,power_law_1.01,0.09019520282745361
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,8,power_law_1.2,0.06832000017166137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,8,power_law_1.01,0.0934719979763031
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,8,power_law_1.2,0.07317759990692138
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,8,power_law_1.01,0.10002559423446655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,128,power_law_1.01,0.03531520068645477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,8,power_law_1.2,0.07447680234909057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,128,power_law_1.01,0.03573119938373566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,8,power_law_1.01,0.11455999612808228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,8,power_law_1.2,0.07468799948692321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,128,power_law_1.01,0.03490560054779053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,8,power_law_1.2,0.07794560194015503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,8,power_law_1.01,0.13566720485687256
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,128,power_law_1.2,0.03433600068092346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,128,power_law_1.01,0.03552640080451965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,8,power_law_1.2,0.07980160117149353
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,8,power_law_1.01,0.16453759670257567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,128,power_law_1.2,0.03495680093765259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,128,power_law_1.01,0.034892800450325015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,8,power_law_1.2,0.08184959888458251
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,128,power_law_1.2,0.03373439908027649
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,8,power_law_1.01,0.1919808030128479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,128,power_law_1.01,0.035519999265670774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,128,power_law_1.2,0.03473919928073883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,8,power_law_1.2,0.08390399813652039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,128,power_law_1.01,0.03573119938373566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,8,power_law_1.01,0.24584319591522216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,128,power_law_1.2,0.03433600068092346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,128,power_law_1.01,0.03654400110244751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,8,power_law_1.2,0.09168639779090881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,8,power_law_1.01,0.29375998973846434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,128,power_law_1.2,0.03351680040359497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,128,power_law_1.01,0.036550399661064145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,8,power_law_1.2,0.09454079866409301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,8,power_law_1.01,0.4104896068572998
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,128,power_law_1.2,0.03495039939880371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,128,power_law_1.01,0.03653759956359863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,8,power_law_1.2,0.10397440195083618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,8,power_law_1.01,0.5243584156036377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,128,power_law_1.2,0.0355648010969162
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,128,power_law_1.01,0.037350401282310486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,8,power_law_1.2,0.12076159715652465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,128,power_law_1.2,0.03516159951686859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,128,power_law_1.01,0.03839359879493713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,8,power_law_1.01,0.7183167934417725
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,8,power_law_1.2,0.138374400138855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,128,power_law_1.2,0.035155200958251955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,128,power_law_1.01,0.03900800049304962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,8,power_law_1.01,0.9440064430236816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,8,power_law_1.2,0.1699072003364563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,128,power_law_1.01,0.04021120071411133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,128,power_law_1.2,0.03616639971733093
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,8,power_law_1.01,1.1514623641967774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,8,power_law_1.2,0.19325439929962157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,128,power_law_1.01,0.04431999921798706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,128,power_law_1.2,0.03761279881000519
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,128,power_law_1.01,0.04474239945411682
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,128,power_law_1.2,0.038438400626182555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,8,power_law_1.01,1.8610879898071289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,8,power_law_1.2,0.26289279460906984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,128,power_law_1.01,0.046393600106239316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,128,power_law_1.2,0.03966720104217529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,8,power_law_1.2,0.32309761047363283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,8,power_law_1.01,3.5523136138916014
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,128,power_law_1.01,0.05084800124168396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,128,power_law_1.2,0.04336000084877014
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,8,power_law_1.2,0.4400383949279785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,128,power_law_1.01,0.057017600536346434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,128,power_law_1.2,0.045798400044441225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,8,power_law_1.2,0.5600512027740479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,128,power_law_1.01,0.06664320230484008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,128,power_law_1.2,0.04764159917831421
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,128,power_law_1.01,0.08035200238227844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,8,power_law_1.2,0.8117504119873047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,128,power_law_1.2,0.054816001653671266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,128,power_law_1.01,0.10698879957199096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,128,power_law_1.2,0.060755199193954466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,8,power_law_1.2,0.9751744270324707
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,128,power_law_1.01,0.12789119482040406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,128,power_law_1.2,0.07674239873886109
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,8,power_law_1.2,1.251046371459961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,64,power_law_1.01,0.03632639944553375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,128,power_law_1.01,0.17949440479278564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,128,power_law_1.2,0.0861631989479065
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,8,power_law_1.2,2.0423871994018556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,64,power_law_1.01,0.03345920145511627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,128,power_law_1.01,0.2204416036605835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,128,power_law_1.2,0.11401599645614624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,64,power_law_1.01,0.0328575998544693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,128,power_law_1.2,0.15679359436035156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,128,power_law_1.01,0.32857599258422854
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,8,power_law_1.2,4.105747222900391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,64,power_law_1.01,0.034508800506591795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,128,power_law_1.2,0.2338047981262207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,128,power_law_1.01,0.39738879203796384
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,64,power_law_1.01,0.03505280017852783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,128,power_law_1.2,0.26576640605926516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,128,power_law_1.01,0.4768511772155762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,64,power_law_1.01,0.035724800825119016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,128,power_law_1.2,0.3825088024139404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,128,power_law_1.01,0.8096511840820313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,64,power_law_1.01,0.03570559918880463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,128,power_law_1.2,0.48181757926940916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,64,power_law_1.01,0.036134400963783266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,128,power_law_1.01,1.5043392181396484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,128,power_law_1.2,0.613708782196045
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,64,power_law_1.01,0.03633280098438263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,64,power_law_1.2,0.03596799969673157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,128,power_law_1.2,1.0411392211914063
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,64,power_law_1.01,0.03694719970226288
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,64,power_law_1.2,0.03372159898281098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,64,power_law_1.01,0.03898879885673523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,128,power_law_1.2,1.904364776611328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,64,power_law_1.2,0.03270399868488312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,64,power_law_1.01,0.03980799913406372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,64,power_law_1.2,0.03331199884414673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,64,power_law_1.01,0.041657599806785586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,64,power_law_1.2,0.03455359935760498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,64,power_law_1.01,0.04207360148429871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,32,power_law_1.01,0.039628800749778745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,64,power_law_1.2,0.03555839955806732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,64,power_law_1.01,0.046367999911308286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,32,power_law_1.01,0.03490560054779053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,64,power_law_1.2,0.03473919928073883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,64,power_law_1.01,0.046374401450157164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,32,power_law_1.01,0.03511680066585541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,64,power_law_1.2,0.037196800112724304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,64,power_law_1.01,0.04555520117282867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,32,power_law_1.01,0.0344895988702774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,64,power_law_1.2,0.03555839955806732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,64,power_law_1.01,0.05107839703559876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,32,power_law_1.2,0.03740800023078918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,32,power_law_1.01,0.036134400963783266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,64,power_law_1.2,0.037196800112724304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,64,power_law_1.01,0.054764801263809205
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,32,power_law_1.2,0.03330560028553009
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,32,power_law_1.01,0.03695360124111176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,64,power_law_1.2,0.04007680118083954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,64,power_law_1.01,0.061939197778701785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,32,power_law_1.2,0.032492798566818235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,32,power_law_1.01,0.037363201379776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,64,power_law_1.2,0.04008319973945618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,32,power_law_1.2,0.032492798566818235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,64,power_law_1.01,0.07975040078163147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,32,power_law_1.01,0.03941119909286499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,64,power_law_1.2,0.04170880019664765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,32,power_law_1.2,0.034143999218940735
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,64,power_law_1.01,0.09859200119972229
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,32,power_law_1.01,0.039827200770378116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,64,power_law_1.2,0.04170239865779877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,32,power_law_1.2,0.035545599460601804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,64,power_law_1.01,0.1262336015701294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,32,power_law_1.01,0.040627199411392215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,64,power_law_1.2,0.046214398741722104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,32,power_law_1.2,0.0367935985326767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,64,power_law_1.01,0.17170560359954834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,32,power_law_1.01,0.042284798622131345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,64,power_law_1.2,0.04702720046043396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,32,power_law_1.2,0.03760640025138855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,64,power_law_1.01,0.210809588432312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,64,power_law_1.2,0.04928640127182007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,32,power_law_1.2,0.03861759901046753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,32,power_law_1.01,0.04268800020217896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,64,power_law_1.01,0.2995007991790771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,64,power_law_1.2,0.052960002422332765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,32,power_law_1.01,0.04433279931545257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,32,power_law_1.2,0.039468801021575926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,64,power_law_1.01,0.40188159942626955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,32,power_law_1.01,0.04227840006351471
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,64,power_law_1.2,0.05563520193099976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,32,power_law_1.2,0.04028159976005554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,64,power_law_1.01,0.4883264064788818
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,32,power_law_1.01,0.04555520117282867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,64,power_law_1.2,0.06997119784355163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,32,power_law_1.2,0.04026240110397339
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,64,power_law_1.01,0.7170815944671631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,32,power_law_1.01,0.047193598747253415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,64,power_law_1.2,0.08470399975776673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,32,power_law_1.2,0.04255360066890716
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,32,power_law_1.01,0.0488319993019104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,64,power_law_1.2,0.11829760074615478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,32,power_law_1.2,0.041280001401901245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,64,power_law_1.01,1.4173055648803712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,32,power_law_1.01,0.053958398103713986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,32,power_law_1.2,0.04498560130596161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,64,power_law_1.2,0.14042240381240845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,32,power_law_1.01,0.05825279951095581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,32,power_law_1.2,0.046623998880386354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,64,power_law_1.2,0.21025280952453612
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,32,power_law_1.2,0.050316798686981204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,32,power_law_1.01,0.06807039976119995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,64,power_law_1.2,0.23463680744171142
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,32,power_law_1.2,0.05604479908943176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,32,power_law_1.01,0.07791360020637512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,64,power_law_1.2,0.3947711944580078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,32,power_law_1.2,0.060134398937225345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,32,power_law_1.01,0.10618239641189575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,64,power_law_1.2,0.4986112117767334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,32,power_law_1.2,0.07692800164222717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,32,power_law_1.01,0.132806396484375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,64,power_law_1.2,0.597331190109253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,16,power_law_1.01,0.04186240136623383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,32,power_law_1.2,0.0896448016166687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,32,power_law_1.01,0.1864575982093811
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,64,power_law_1.2,0.9800704002380372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,16,power_law_1.01,0.03612160086631775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,32,power_law_1.2,0.12035200595855713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,32,power_law_1.01,0.2159679889678955
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,16,power_law_1.01,0.033670398592948916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,32,power_law_1.2,0.14328320026397706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,32,power_law_1.01,0.29827840328216554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,64,power_law_1.2,2.084172821044922
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,16,power_law_1.01,0.03530240058898926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,32,power_law_1.2,0.19838080406188965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,32,power_law_1.01,0.4023104190826416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,16,power_law_1.01,0.036134400963783266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,32,power_law_1.2,0.23831679821014404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,32,power_law_1.01,0.4617023944854736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,16,power_law_1.01,0.03857919871807099
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,32,power_law_1.2,0.3968319892883301
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,32,power_law_1.01,0.7404096126556396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,16,power_law_1.01,0.038380798697471616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,32,power_law_1.2,0.4879551887512207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,16,power_law_1.01,0.03980799913406372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,32,power_law_1.01,1.5313728332519532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,32,power_law_1.2,0.5907455921173096
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,16,power_law_1.01,0.0394239991903305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,32,power_law_1.2,1.1335040092468263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,16,power_law_1.2,0.041094401478767396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,16,power_law_1.01,0.04102399945259094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,16,power_law_1.2,0.03351039886474609
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,16,power_law_1.01,0.04227199852466583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,32,power_law_1.2,2.1247232437133787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,16,power_law_1.2,0.032691198587417605
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,16,power_law_1.01,0.043705600500106814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,16,power_law_1.2,0.034694400429725644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,16,power_law_1.01,0.044121599197387694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,16,power_law_1.2,0.03575679957866669
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,16,power_law_1.2,0.038841599225997926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,16,power_law_1.2,0.0380160003900528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,8,power_law_1.01,0.046988800168037415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,16,power_law_1.2,0.03944959938526153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,8,power_law_1.01,0.03696640133857727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,16,power_law_1.2,0.040275201201438904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,8,power_law_1.01,0.03552640080451965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,16,power_law_1.2,0.04007039964199066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,8,power_law_1.01,0.03695360124111176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,8,power_law_1.2,0.04170880019664765
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,16,power_law_1.2,0.04314239919185638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,8,power_law_1.01,0.03818880021572113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,8,power_law_1.2,0.03475840091705322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,16,power_law_1.2,0.04293760061264038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,8,power_law_1.01,0.041843199729919435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,8,power_law_1.2,0.03433600068092346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,16,power_law_1.2,0.0456063985824585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,8,power_law_1.01,0.04222719967365265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,8,power_law_1.2,0.03534719944000244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,16,power_law_1.2,0.045798400044441225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,8,power_law_1.01,0.04391680061817169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,8,power_law_1.2,0.03783040046691895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,16,power_law_1.2,0.04970879852771759
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,8,power_law_1.01,0.04412800073623657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,8,power_law_1.2,0.0412992000579834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,16,power_law_1.2,0.05256320238113403
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,8,power_law_1.01,0.043910399079322815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,8,power_law_1.2,0.04211840033531189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,16,power_law_1.2,0.05072640180587769
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,8,power_law_1.01,0.04678399860858917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,8,power_law_1.2,0.04294399917125702
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,16,power_law_1.2,0.057683199644088745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,8,power_law_1.01,0.0486272007226944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,8,power_law_1.2,0.043558400869369504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,16,power_law_1.2,0.06260480284690857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,8,power_law_1.01,0.050271999835968015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,8,power_law_1.2,0.043756800889968875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,16,power_law_1.2,0.08021119832992554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,8,power_law_1.01,0.04924159944057464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,8,power_law_1.2,0.04642559885978699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,16,power_law_1.2,0.09433599710464477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,8,power_law_1.01,0.05456640124320984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,8,power_law_1.2,0.04969600141048432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,8,power_law_1.01,0.05660799741744995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,16,power_law_1.2,0.13262720108032228
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,8,power_law_1.2,0.05092480182647705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,8,power_law_1.01,0.059084802865982056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,16,power_law_1.2,0.15741440057754516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,8,power_law_1.2,0.04867199957370758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,8,power_law_1.01,0.06521599888801574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,16,power_law_1.2,0.22848000526428222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,8,power_law_1.2,0.05563520193099976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,8,power_law_1.01,0.07033600211143494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,16,power_law_1.2,0.2770240068435669
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,8,power_law_1.2,0.05626239776611328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,8,power_law_1.01,0.08815360069274902
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,16,power_law_1.2,0.4568448066711426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,8,power_law_1.2,0.058911997079849246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,8,power_law_1.01,0.1016767978668213
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,16,power_law_1.2,0.4961599826812744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,8,power_law_1.2,0.06668800115585327
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,8,power_law_1.01,0.13813120126724243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,16,power_law_1.2,0.6712575912475586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,8,power_law_1.2,0.07243520021438599
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,8,power_law_1.01,0.16554880142211914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,16,power_law_1.2,1.003046417236328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,8,power_law_1.2,0.09189119935035706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,8,power_law_1.01,0.23561599254608154
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,8,power_law_1.2,0.10766079425811767
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,8,power_law_1.01,0.3011264085769653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,16,power_law_1.2,2.6741952896118164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,8,power_law_1.2,0.1438976049423218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,8,power_law_1.01,0.4031424045562744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,8,power_law_1.2,0.18098560571670533
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,8,power_law_1.01,0.5583680152893067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,8,power_law_1.2,0.2366719961166382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,8,power_law_1.01,0.6400832176208496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,8,power_law_1.2,0.2878848075866699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,8,power_law_1.01,0.9706239700317383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,8,power_law_1.2,0.45027837753295896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,8,power_law_1.2,0.6425343990325928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,8,power_law_1.01,1.8815040588378906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,8,power_law_1.2,0.7847104072570801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,32,power_law_1.01,0.05583360195159912
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,32,power_law_1.01,0.05562880039215088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,8,power_law_1.2,1.293177604675293
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,32,power_law_1.01,0.04969600141048432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,8,power_law_1.2,2.6152320861816407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,32,power_law_1.01,0.051123201847076416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,32,power_law_1.01,0.051948797702789304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,32,power_law_1.01,0.05317760109901428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,32,power_law_1.01,0.05440639853477478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,32,power_law_1.2,0.06050559878349304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,32,power_law_1.01,0.05644800066947937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,32,power_law_1.2,0.056620800495147706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,32,power_law_1.01,0.05687040090560913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,32,power_law_1.2,0.05089920163154602
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,32,power_law_1.01,0.05911039710044861
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,32,power_law_1.2,0.052121597528457644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,32,power_law_1.01,0.06218240261077881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,32,power_law_1.2,0.05129600167274475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,16,power_law_1.01,0.06259840130805969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,32,power_law_1.01,0.06342399716377259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,32,power_law_1.2,0.05621119737625122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,16,power_law_1.01,0.05790079832077026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,32,power_law_1.01,0.06607999801635742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,32,power_law_1.2,0.0574400007724762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,32,power_law_1.01,0.06587520241737366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,32,power_law_1.2,0.05702400207519531
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,16,power_law_1.01,0.05052800178527832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,32,power_law_1.2,0.05742719769477844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,16,power_law_1.01,0.05112959742546082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,32,power_law_1.2,0.05968639850616455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,16,power_law_1.01,0.052774399518966675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,32,power_law_1.2,0.061740797758102414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,16,power_law_1.01,0.05728639960289002
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,16,power_law_1.01,0.05764480233192444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,32,power_law_1.2,0.06277120113372803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,16,power_law_1.01,0.05932160019874573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,32,power_law_1.2,0.06317440271377564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,16,power_law_1.01,0.05851519703865051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,32,power_law_1.2,0.0676800012588501
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,16,power_law_1.01,0.06199679970741272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,32,power_law_1.2,0.07341439723968506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,16,power_law_1.01,0.06731520295143127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,32,power_law_1.2,0.07587199807167053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,16,power_law_1.01,0.06711040139198303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,32,power_law_1.2,0.0787392020225525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,16,power_law_1.01,0.06997119784355163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,32,power_law_1.2,0.08672000169754028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,16,power_law_1.01,0.06976640224456787
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,32,power_law_1.2,0.09921919703483581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,16,power_law_1.01,0.07570559978485107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,32,power_law_1.2,0.12993279695510865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,16,power_law_1.01,0.07693439722061157
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,32,power_law_1.2,0.15000319480895996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,16,power_law_1.01,0.08083199858665466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,32,power_law_1.2,0.19833600521087646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,16,power_law_1.01,0.0927295982837677
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,32,power_law_1.2,0.23418240547180175
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,16,power_law_1.01,0.10357120037078857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,32,power_law_1.2,0.31712639331817627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,16,power_law_1.01,0.13530240058898926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,32,power_law_1.2,0.40968961715698243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,16,power_law_1.01,0.15415040254592896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,32,power_law_1.2,0.6839231967926025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,16,power_law_1.01,0.1942720055580139
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,32,power_law_1.2,0.7482304096221923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,16,power_law_1.01,0.23463680744171142
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,32,power_law_1.2,0.96693115234375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,16,power_law_1.01,0.3304768085479736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,32,power_law_1.2,1.5514431953430177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,16,power_law_1.01,0.3833215951919556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,16,power_law_1.01,0.5744063854217529
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,32,power_law_1.2,3.037260818481445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,16,power_law_1.01,0.7269824028015137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,16,power_law_1.01,0.8833600044250488
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,16,power_law_1.01,1.3514112472534179
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,16,power_law_1.01,3.0963136672973635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,16,power_law_1.2,0.06805760264396668
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,16,power_law_1.2,0.05047680139541626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,16,power_law_1.2,0.05169919729232788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,16,power_law_1.2,0.052108800411224364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,16,power_law_1.2,0.05469440221786499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,16,power_law_1.2,0.05907840132713318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,16,power_law_1.2,0.05907840132713318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,8,power_law_1.01,0.06259840130805969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,16,power_law_1.2,0.060710400342941284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,8,power_law_1.01,0.055430400371551516
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,16,power_law_1.2,0.061337602138519284
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,16,power_law_1.2,0.06316800117492676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,8,power_law_1.01,0.051551997661590576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,16,power_law_1.2,0.06829439997673034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,8,power_law_1.01,0.053388798236846925
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,16,power_law_1.2,0.06931840181350708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,8,power_law_1.01,0.05625600218772888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,8,power_law_1.01,0.0640447974205017
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,16,power_law_1.2,0.07136639952659607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,8,power_law_1.01,0.06362239718437195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,16,power_law_1.2,0.07095040082931518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,8,power_law_1.01,0.06547840237617493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,16,power_law_1.2,0.07710080146789551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,8,power_law_1.01,0.06669440269470214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,8,power_law_1.01,0.06874880194664001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,8,power_law_1.01,0.073580801486969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,8,power_law_1.01,0.07611520290374756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,8,power_law_1.01,0.07857279777526856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,8,power_law_1.01,0.07694079875946044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,8,power_law_1.01,0.08145279884338379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,8,power_law_1.01,0.08472959995269776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,8,power_law_1.01,0.09045760035514831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,8,power_law_1.01,0.1043776035308838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,8,power_law_1.01,0.12295039892196655
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,8,power_law_1.01,0.14986239671707152
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,8,power_law_1.01,0.17032320499420167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,8,power_law_1.01,0.22439041137695312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,8,power_law_1.01,0.2592128038406372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,8,power_law_1.01,0.35895040035247805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,8,power_law_1.01,0.44162559509277344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,8,power_law_1.01,0.6774144172668457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,16,power_law_1.01,0.043910399079322815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,8,power_law_1.01,0.8318335533142089
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,16,power_law_1.01,0.050457602739334105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,8,power_law_1.01,1.0432064056396484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,16,power_law_1.01,0.05025920271873474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,8,power_law_1.01,1.5342911720275878
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,16,power_law_1.01,0.05087360143661499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,16,power_law_1.01,0.05660799741744995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,8,power_law_1.01,3.2332927703857424
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,16,power_law_1.01,0.06725119948387145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,16,power_law_1.01,0.07585920095443725
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,16,power_law_1.01,0.08609920144081115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,16,power_law_1.01,0.11518080234527588
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,16,power_law_1.01,0.14958080053329467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,16,power_law_1.01,0.18951040506362915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,16,power_law_1.01,0.23539841175079346
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,16,power_law_1.01,0.3363584041595459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,16,power_law_1.01,0.428934383392334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,16,power_law_1.01,0.5432127952575684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,8,power_law_1.2,0.06301440000534057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,16,power_law_1.01,0.8530688285827637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,8,power_law_1.2,0.050316798686981204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,8,power_law_1.2,0.05113599896430969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,16,power_law_1.01,1.5272831916809082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,8,power_law_1.2,0.05318400263786316
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,8,power_law_1.2,0.05603839755058289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,8,power_law_1.2,0.06219519972801209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,8,power_law_1.2,0.06341760158538819
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,8,power_law_1.2,0.06301440000534057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,8,power_law_1.2,0.06629120111465454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,8,power_law_1.2,0.07080320119857789
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,8,power_law_1.2,0.06997119784355163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,128,power_law_1.01,0.06684160232543945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,8,power_law_1.2,0.07284479737281799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,128,power_law_1.01,0.06110720038414001
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,8,power_law_1.2,0.07652480006217957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,8,power_law_1.2,0.07509120106697083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,128,power_law_1.01,0.057011198997497556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,8,power_law_1.2,0.08349440097808838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,128,power_law_1.01,0.055795198678970336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,8,power_law_1.2,0.085343998670578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,128,power_law_1.01,0.055795198678970336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,8,power_law_1.2,0.09393919706344604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,128,power_law_1.01,0.05803520083427429
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,8,power_law_1.2,0.10601600408554077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,8,power_law_1.2,0.12691199779510498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,128,power_law_1.01,0.05661439895629883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,8,power_law_1.2,0.15516799688339233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,128,power_law_1.01,0.05968639850616455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,8,power_law_1.2,0.18056960105895997
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,128,power_law_1.01,0.06255360245704651
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,8,power_law_1.2,0.22766718864440919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,128,power_law_1.01,0.06335999965667724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,8,power_law_1.2,0.2866624116897583
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,8,power_law_1.2,0.3972480058670044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,8,power_law_1.2,0.5273024082183838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,8,power_law_1.2,0.695033597946167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,8,power_law_1.2,1.0067328453063964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,8,power_law_1.2,1.1089280128479004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,8,power_law_1.2,1.9915903091430665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,8,power_law_1.2,3.8159744262695314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,32,power_law_1.01,0.070169597864151
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,32,power_law_1.01,0.07120000123977661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,32,power_law_1.01,0.07529600262641907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,128,power_law_1.2,0.07898240089416504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,32,power_law_1.01,0.08389760255813598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,128,power_law_1.2,0.07752320170402527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,32,power_law_1.01,0.09658880233764648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,128,power_law_1.2,0.05441920161247253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,32,power_law_1.01,0.11624959707260132
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,128,power_law_1.2,0.056460797786712646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,32,power_law_1.01,0.14083199501037597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,128,power_law_1.2,0.05665919780731201
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,32,power_law_1.01,0.18260480165481568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,128,power_law_1.2,0.056454402208328244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,32,power_law_1.01,0.21393280029296874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,128,power_law_1.2,0.05850239992141724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,32,power_law_1.01,0.29319679737091064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,128,power_law_1.2,0.05932160019874573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,32,power_law_1.01,0.3612096071243286
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,128,power_law_1.2,0.06136959791183472
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,32,power_law_1.01,0.5113344192504883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,128,power_law_1.2,0.05891839861869812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,32,power_law_1.01,0.6810815811157227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,128,power_law_1.2,0.06383360028266907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,32,power_law_1.01,0.833465576171875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,128,power_law_1.2,0.06670719981193543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,32,power_law_1.01,1.332153606414795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,128,power_law_1.2,0.06751360297203064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,32,power_law_1.01,2.6205440521240235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,128,power_law_1.2,0.07079039812088013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,128,power_law_1.2,0.07612159848213196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,128,power_law_1.2,0.07939839959144593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,128,power_law_1.2,0.08881919980049133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,128,power_law_1.2,0.10226559638977051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,128,power_law_1.2,0.1189120054244995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,128,power_law_1.2,0.14840960502624512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,64,power_law_1.01,0.06259199976921082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,128,power_law_1.2,0.1693120002746582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,64,power_law_1.01,0.06832000017166137
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,128,power_law_1.2,0.2256256103515625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,64,power_law_1.01,0.06956160068511963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,128,power_law_1.2,0.27314560413360595
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,64,power_law_1.01,0.05604479908943176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,128,power_law_1.2,0.3726720094680786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,64,power_law_1.01,0.05809280276298523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,64,power_law_1.01,0.056454402208328244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,128,power_law_1.2,0.47855358123779296
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,64,power_law_1.01,0.057683199644088745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,128,power_law_1.2,0.7138751983642578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,64,power_law_1.01,0.06217600107192993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,128,power_law_1.2,0.8805631637573242
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,64,power_law_1.01,0.06034560203552246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,128,power_law_1.2,1.1432576179504395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,64,power_law_1.01,0.0634112000465393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,128,power_law_1.2,1.8595199584960938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,64,power_law_1.01,0.06587520241737366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,64,power_law_1.01,0.06587520241737366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,128,power_law_1.2,3.8171905517578124
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,64,power_law_1.01,0.06785920262336731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,64,power_law_1.01,0.07407360076904297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,64,power_law_1.01,0.08062080144882203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,64,power_law_1.01,0.08019840121269226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,64,power_law_1.01,0.09004160165786743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,64,power_law_1.01,0.10192639827728271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,64,power_law_1.2,0.07366399765014649
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,64,power_law_1.01,0.11337599754333497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,16,power_law_1.2,0.08119040131568908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,64,power_law_1.2,0.06547200083732604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,64,power_law_1.01,0.13979519605636598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,16,power_law_1.2,0.08200960159301758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,64,power_law_1.2,0.06465920209884643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,64,power_law_1.01,0.1643839955329895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,16,power_law_1.2,0.09757440090179444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,64,power_law_1.2,0.05317760109901428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,64,power_law_1.01,0.21536641120910643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,16,power_law_1.2,0.10821759700775146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,64,power_law_1.2,0.05850239992141724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,64,power_law_1.01,0.25797760486602783
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,16,power_law_1.2,0.13935999870300292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,64,power_law_1.2,0.05768960118293762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,16,power_law_1.2,0.16453759670257567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,64,power_law_1.01,0.3476991891860962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,16,power_law_1.2,0.1981376051902771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,64,power_law_1.2,0.05788800120353699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,64,power_law_1.01,0.4383999824523926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,16,power_law_1.2,0.24995839595794678
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,64,power_law_1.2,0.060550397634506224
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,64,power_law_1.01,0.6284543991088867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,16,power_law_1.2,0.3535615921020508
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,64,power_law_1.2,0.05911679863929749
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,64,power_law_1.01,0.8129728317260743
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,16,power_law_1.2,0.4445055961608887
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,64,power_law_1.2,0.06219519972801209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,64,power_law_1.01,0.9768320083618164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,16,power_law_1.2,0.603436803817749
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,64,power_law_1.2,0.06504319906234741
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,16,power_law_1.2,0.8284992218017578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,64,power_law_1.01,1.5203455924987792
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,64,power_law_1.2,0.06792960166931153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,16,power_law_1.2,1.0505151748657227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,64,power_law_1.2,0.06997119784355163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,64,power_law_1.01,2.9754816055297852
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,16,power_law_1.2,1.6395135879516602
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,64,power_law_1.2,0.07181439995765686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,64,power_law_1.2,0.0822655975818634
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,16,power_law_1.2,3.7778175354003904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,64,power_law_1.2,0.08428800106048584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,64,power_law_1.2,0.08922880291938781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,64,power_law_1.2,0.10274560451507568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,64,power_law_1.2,0.11585279703140258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,64,power_law_1.2,0.14636160135269166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,32,power_law_1.01,0.06710399985313416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,64,power_law_1.2,0.16869759559631348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,32,power_law_1.01,0.0671231985092163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,64,power_law_1.2,0.2178368091583252
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,32,power_law_1.2,0.08015360236167908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,32,power_law_1.01,0.06751999855041504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,64,power_law_1.2,0.27518720626831056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,32,power_law_1.2,0.0760640025138855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,32,power_law_1.01,0.05234559774398804
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,32,power_law_1.2,0.06234880089759827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,64,power_law_1.2,0.3697983980178833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,32,power_law_1.01,0.05440639853477478
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,32,power_law_1.2,0.053548800945281985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,64,power_law_1.2,0.4761023998260498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,32,power_law_1.01,0.05686399936676025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,32,power_law_1.2,0.05742080211639404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,32,power_law_1.01,0.05971840023994446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,64,power_law_1.2,0.6942080020904541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,32,power_law_1.2,0.05906559824943543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,32,power_law_1.01,0.06320639848709106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,64,power_law_1.2,0.8633791923522949
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,32,power_law_1.2,0.06152960062026978
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,32,power_law_1.01,0.06669440269470214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,64,power_law_1.2,1.0896703720092773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,32,power_law_1.2,0.06519039869308471
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,32,power_law_1.01,0.06689919829368592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,64,power_law_1.2,1.660851287841797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,32,power_law_1.01,0.0664896011352539
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,32,power_law_1.2,0.06561279892921448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,64,power_law_1.2,3.5110206604003906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,32,power_law_1.01,0.07201279997825623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,32,power_law_1.2,0.06788480281829834
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,32,power_law_1.01,0.0716159999370575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,32,power_law_1.2,0.07299839854240417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,32,power_law_1.01,0.07816960215568543
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,32,power_law_1.2,0.07175040245056152
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,32,power_law_1.01,0.0855296015739441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,32,power_law_1.2,0.07525759935379028
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,32,power_law_1.01,0.09002879858016968
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,32,power_law_1.2,0.08073599934577942
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,32,power_law_1.01,0.09166719913482665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,32,power_law_1.2,0.08610560297966004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,32,power_law_1.01,0.10517760515213012
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,32,power_law_1.2,0.0869055986404419
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,16,power_law_1.01,0.07038080096244811
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,32,power_law_1.01,0.12158080339431762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,32,power_law_1.2,0.0996288001537323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,16,power_law_1.01,0.06915839910507202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,32,power_law_1.01,0.149017596244812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,32,power_law_1.2,0.11109119653701782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,16,power_law_1.01,0.07428479790687562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,32,power_law_1.01,0.17237119674682616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,32,power_law_1.2,0.12174079418182374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,16,power_law_1.01,0.05317760109901428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,32,power_law_1.2,0.15304319858551024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,32,power_law_1.01,0.21865599155426024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,16,power_law_1.01,0.05563520193099976
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,32,power_law_1.2,0.17704319953918457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,32,power_law_1.01,0.26739840507507323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,16,power_law_1.01,0.060140800476074216
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,32,power_law_1.2,0.22619519233703614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,32,power_law_1.01,0.35710721015930175
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,128,power_law_1.01,0.06316159963607788
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,16,power_law_1.01,0.06443520188331604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,32,power_law_1.2,0.27411839962005613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,32,power_law_1.01,0.45969281196594236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,128,power_law_1.01,0.06561279892921448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,16,power_law_1.01,0.06629120111465454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,32,power_law_1.2,0.38593919277191163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,32,power_law_1.01,0.6761792182922364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,128,power_law_1.01,0.06787199974060058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,16,power_law_1.01,0.0691648006439209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,32,power_law_1.2,0.5034815788269043
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,32,power_law_1.01,0.8322367668151855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,128,power_law_1.01,0.07012479901313781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,16,power_law_1.01,0.06997759938240052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,32,power_law_1.2,0.6830848217010498
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,32,power_law_1.01,1.0521792411804198
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,16,power_law_1.01,0.0728384017944336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,128,power_law_1.01,0.076665598154068
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,32,power_law_1.2,0.9030464172363282
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,16,power_law_1.01,0.0779583990573883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,128,power_law_1.01,0.07953919768333435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,32,power_law_1.01,1.5833600044250489
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,32,power_law_1.2,1.108454418182373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,16,power_law_1.01,0.08021119832992554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,128,power_law_1.01,0.08526719808578491
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,32,power_law_1.01,3.077459144592285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,16,power_law_1.01,0.08635519742965699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,128,power_law_1.01,0.101254403591156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,32,power_law_1.2,1.811961555480957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,16,power_law_1.01,0.09393919706344604
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,128,power_law_1.01,0.11108479499816895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,32,power_law_1.2,3.570150375366211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,16,power_law_1.01,0.09659519791603088
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,128,power_law_1.01,0.1360703945159912
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,16,power_law_1.01,0.09742079973220825
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,128,power_law_1.01,0.16350719928741456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,16,power_law_1.01,0.1121664047241211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,128,power_law_1.01,0.21266560554504393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,16,power_law_1.01,0.13059840202331544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,128,power_law_1.01,0.25813119411468505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,16,power_law_1.01,0.15904639959335326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,128,power_law_1.01,0.34186880588531493
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,16,power_law_1.2,0.06832640171051026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,16,power_law_1.01,0.18262399435043336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,128,power_law_1.01,0.44941439628601076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,16,power_law_1.2,0.06915199756622314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,16,power_law_1.01,0.236678409576416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,128,power_law_1.01,0.6296127796173095
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,16,power_law_1.2,0.0634112000465393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,16,power_law_1.01,0.29114880561828616
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,128,power_law_1.01,0.804319953918457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,16,power_law_1.2,0.05480960011482239
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,16,power_law_1.01,0.3872191905975342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,8,power_law_1.01,0.06993280053138733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,16,power_law_1.2,0.05624960064888
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,128,power_law_1.01,1.0378047943115234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,8,power_law_1.01,0.07176960110664368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,16,power_law_1.01,0.5047743797302247
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,16,power_law_1.2,0.06259840130805969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,128,power_law_1.01,1.5362624168395995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,8,power_law_1.01,0.08242560029029847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,16,power_law_1.01,0.7109888076782227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,16,power_law_1.2,0.06423680186271667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,8,power_law_1.01,0.05661439895629883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,16,power_law_1.01,0.9043328285217285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,128,power_law_1.01,3.0978879928588867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,16,power_law_1.2,0.06812800168991089
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,8,power_law_1.01,0.06294400095939637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,16,power_law_1.01,1.104422378540039
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,16,power_law_1.2,0.07078400254249573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,8,power_law_1.01,0.06807680130004883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,16,power_law_1.2,0.0728384017944336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,16,power_law_1.01,1.6760000228881835
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,8,power_law_1.01,0.07341439723968506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,16,power_law_1.2,0.07529600262641907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,8,power_law_1.01,0.07955200076103211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,16,power_law_1.01,3.421311950683594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,16,power_law_1.2,0.07651200294494628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,8,power_law_1.01,0.08426240086555481
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,16,power_law_1.2,0.07896959781646729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,8,power_law_1.01,0.08446720242500305
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,16,power_law_1.2,0.08206080198287964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,32,8,power_law_1.01,0.018361599743366243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,32,8,power_law_1.01,0.018783999979496
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,8,power_law_1.01,0.08877440094947815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,16,power_law_1.2,0.08757759928703308
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,32,8,power_law_1.01,0.018771199882030486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,8,power_law_1.01,0.09409919977188111
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,16,power_law_1.2,0.09105920195579528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,32,8,power_law_1.01,0.01918720006942749
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,8,power_law_1.2,0.07011839747428894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,32,8,power_law_1.01,0.01918720006942749
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,8,power_law_1.01,0.0945088028907776
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,16,power_law_1.2,0.09864320158958435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,8,power_law_1.2,0.07095040082931518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,32,8,power_law_1.01,0.019993600249290467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,8,power_law_1.01,0.09553279876708984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,16,power_law_1.2,0.11626240015029907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,8,power_law_1.2,0.05865600109100342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,32,8,power_law_1.01,0.020627200603485107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,32,8,power_law_1.01,0.02082560062408447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,8,power_law_1.01,0.10350719690322877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,16,power_law_1.2,0.13509119749069215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,8,power_law_1.2,0.05658239722251892
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,32,8,power_law_1.01,0.022463999688625336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,8,power_law_1.01,0.10781439542770385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,16,power_law_1.2,0.16172800064086915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,8,power_law_1.2,0.06111360192298889
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,32,8,power_law_1.01,0.022463999688625336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,8,power_law_1.01,0.11560319662094116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,32,8,power_law_1.01,0.02328319996595383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,16,power_law_1.2,0.19039360284805298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,8,power_law_1.2,0.06643840074539184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,32,8,power_law_1.01,0.02696320116519928
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,8,power_law_1.01,0.1364799976348877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,16,power_law_1.2,0.24078080654144288
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,8,power_law_1.2,0.07176960110664368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,32,8,power_law_1.01,0.027372801303863527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,8,power_law_1.01,0.15123840570449829
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,32,8,power_law_1.01,0.028799998760223388
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,8,power_law_1.2,0.07831040024757385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,16,power_law_1.2,0.30610558986663816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,32,8,power_law_1.01,0.02961919903755188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,8,power_law_1.01,0.187283194065094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,8,power_law_1.2,0.0832319974899292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,16,power_law_1.2,0.40133118629455566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,32,8,power_law_1.01,0.03043839931488037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,8,power_law_1.01,0.21758720874786378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,32,8,power_law_1.01,0.03208320140838623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,8,power_law_1.2,0.0840448021888733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,16,power_law_1.2,0.5150015830993653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,32,8,power_law_1.01,0.03475199937820435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,8,power_law_1.01,0.2778048038482666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,8,power_law_1.2,0.08630399703979492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,16,power_law_1.2,0.7367936134338379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,32,8,power_law_1.01,0.03925760090351105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,8,power_law_1.01,0.32899839878082277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,32,8,power_law_1.01,0.05544959902763367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,8,power_law_1.2,0.08814719915390015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,16,power_law_1.2,0.9493824005126953
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,32,8,power_law_1.01,0.06342399716377259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,8,power_law_1.01,0.4498303890228271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,8,power_law_1.2,0.08979200124740601
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,32,8,power_law_1.01,0.08716800212860107
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,16,power_law_1.2,1.198630428314209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,8,power_law_1.01,0.5755775928497314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,32,8,power_law_1.01,0.10375679731369018
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,8,power_law_1.2,0.09552000164985656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,16,power_law_1.2,1.83819522857666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,32,8,power_law_1.01,0.15271040201187133
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,8,power_law_1.01,0.8305600166320801
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,8,power_law_1.2,0.10370559692382812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,32,8,power_law_1.01,0.1854848027229309
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,8,power_law_1.01,1.0304384231567383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,16,power_law_1.2,3.669728088378906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,8,power_law_1.2,0.10329600572586059
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,32,8,power_law_1.01,0.26145920753479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,32,8,power_law_1.01,0.35382399559020994
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,8,power_law_1.2,0.11640959978103638
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,8,power_law_1.01,1.2870400428771973
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,32,8,power_law_1.01,0.39047040939331057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,8,power_law_1.2,0.1375167965888977
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,32,8,power_law_1.01,0.6276351928710937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,8,power_law_1.01,2.0120447158813475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,6144,16384,2,8,32,8,power_law_1.2,0.018777599930763243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,8,power_law_1.2,0.15365760326385497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,6144,16384,2,8,32,8,power_law_1.2,0.01834239959716797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,32,8,power_law_1.01,1.3186240196228027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,6144,16384,2,8,32,8,power_law_1.2,0.01875839978456497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,8,power_law_1.01,3.8560512542724608
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,8,power_law_1.2,0.19013760089874268
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,6144,16384,2,8,32,8,power_law_1.2,0.018559999763965607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,8,power_law_1.2,0.2190079927444458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,6144,16384,2,8,32,8,power_law_1.2,0.018764799833297728
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,32,8,power_law_1.01,0.036185601353645326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,6144,16384,2,8,32,8,power_law_1.2,0.01916159987449646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,6144,16384,2,8,32,8,power_law_1.2,0.038176000118255615
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,8,power_law_1.2,0.28270080089569094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,32,8,power_law_1.01,0.03781760036945343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,6144,16384,2,8,32,8,power_law_1.2,0.02019840031862259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,6144,16384,2,8,32,8,power_law_1.2,0.039827200770378116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,32,8,power_law_1.01,0.0382207989692688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,8,power_law_1.2,0.3441472053527832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,6144,16384,2,8,32,8,power_law_1.2,0.020819200575351714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,6144,16384,2,8,32,8,power_law_1.2,0.039417600631713866
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,32,8,power_law_1.01,0.03761920034885406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,6144,16384,2,8,32,8,power_law_1.2,0.022041599452495574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,6144,16384,2,8,32,8,power_law_1.2,0.03941119909286499
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,32,8,power_law_1.01,0.036556801199913024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,8,power_law_1.2,0.4678463935852051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,6144,16384,2,8,32,8,power_law_1.2,0.022860799729824067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,6144,16384,2,8,32,8,power_law_1.2,0.03900800049304962
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,32,8,power_law_1.01,0.03781760036945343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,8,power_law_1.2,0.5936063766479492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,6144,16384,2,8,32,8,power_law_1.2,0.023263999819755556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,6144,16384,2,8,32,8,power_law_1.2,0.04023039937019348
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,32,8,power_law_1.01,0.03842560052871704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,6144,16384,2,8,32,8,power_law_1.2,0.027372801303863527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,6144,16384,2,8,32,8,power_law_1.2,0.040243199467658995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,32,8,power_law_1.01,0.03925119936466217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,8,power_law_1.2,0.8751872062683106
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,6144,16384,2,8,32,8,power_law_1.2,0.02778240144252777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,32,8,power_law_1.01,0.04007680118083954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,6144,16384,2,8,32,8,power_law_1.2,0.028191998600959778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,8,power_law_1.2,1.0711872100830078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,32,8,power_law_1.01,0.03903999924659729
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,6144,16384,2,8,32,8,power_law_1.2,0.029625600576400755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,32,8,power_law_1.01,0.040479999780654904
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,8,power_law_1.2,1.2940032005310058
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,6144,16384,2,8,32,8,power_law_1.2,0.03043839931488037
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,32,8,power_law_1.01,0.04007680118083954
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,6144,16384,2,8,32,8,power_law_1.2,0.0322816014289856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,32,8,power_law_1.01,0.04131839871406555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,8,power_law_1.2,2.057907295227051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,6144,16384,2,8,32,8,power_law_1.2,0.034534400701522826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,32,8,power_law_1.01,0.042316800355911253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,6144,16384,2,8,32,8,power_law_1.2,0.03924480080604553
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,32,8,power_law_1.01,0.046828800439834596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,8,power_law_1.2,4.230630493164062
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,6144,16384,2,8,32,8,power_law_1.2,0.057683199644088745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,32,8,power_law_1.01,0.04785920083522797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,6144,16384,2,8,32,8,power_law_1.2,0.06362239718437195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,32,8,power_law_1.01,0.05235199928283692
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,32,8,power_law_1.01,0.05787519812583923
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,6144,16384,2,8,32,8,power_law_1.2,0.08798720240592957
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,32,8,power_law_1.01,0.06199679970741272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,6144,16384,2,8,32,8,power_law_1.2,0.10478719472885131
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,32,8,power_law_1.01,0.07427200078964233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,6144,16384,2,8,32,8,power_law_1.2,0.14287999868392945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,1,256,power_law_1.01,0.02136960029602051
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,32,8,power_law_1.01,0.084307199716568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,6144,16384,2,8,32,8,power_law_1.2,0.18076800107955932
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,32,8,power_law_1.01,0.11032960414886475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,1,256,power_law_1.01,0.021388800442218782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,6144,16384,2,8,32,8,power_law_1.2,0.27660160064697265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,32,8,power_law_1.01,0.1379647970199585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,6144,16384,2,8,32,8,power_law_1.2,0.3263808012008667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,1,256,power_law_1.01,0.021382400393486024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,32,8,power_law_1.01,0.1850559949874878
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,6144,16384,2,8,32,8,power_law_1.2,0.4172800064086914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,1,256,power_law_1.01,0.021382400393486024
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,32,8,power_law_1.01,0.21784958839416504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,6144,16384,2,8,32,8,power_law_1.2,0.6380735874176026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,1,256,power_law_1.01,0.022195200622081756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,32,8,power_law_1.01,0.30304000377655027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,6144,16384,2,8,32,8,power_law_1.2,1.3141247749328613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,32,8,power_law_1.01,0.38535680770874026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,1,256,power_law_1.01,0.024460799992084503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,32,8,power_law_1.01,0.4650112152099609
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,1,256,power_law_1.01,0.02917119860649109
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,32,8,power_law_1.01,0.7208191871643066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,1,256,power_law_1.01,0.027935999631881713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,32,8,power_law_1.01,1.5133952140808105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,1,256,power_law_1.01,0.03326080143451691
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,1,256,power_law_1.2,0.021184000372886657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,1,256,power_law_1.01,0.035718399286270144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,1,256,power_law_1.2,0.020819200575351714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,1,256,power_law_1.01,0.03994880020618439
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,1,256,power_law_1.2,0.021222400665283202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,1,256,power_law_1.01,0.06198400259017944
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,1,256,power_law_1.01,0.038796800374984744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,1,256,power_law_1.2,0.02122880071401596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,1,256,power_law_1.01,0.05687040090560913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,1,256,power_law_1.01,0.04595839977264404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,1,256,power_law_1.2,0.022041599452495574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,1,256,power_law_1.01,0.0576960027217865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,1,256,power_law_1.01,0.058246397972106935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,1,256,power_law_1.01,0.05872640013694763
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,1,256,power_law_1.2,0.026137599349021913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,1,256,power_law_1.01,0.04595839977264404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,1,256,power_law_1.01,0.05503360033035278
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,1,256,power_law_1.2,0.032287999987602234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,1,256,power_law_1.01,0.04821119904518127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,1,256,power_law_1.01,0.05666559934616089
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,1,256,power_law_1.2,0.032902398705482484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,1,256,power_law_1.01,0.05496320128440857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,1,256,power_law_1.01,0.057068800926208495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,1,256,power_law_1.2,0.03863680064678192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,1,256,power_law_1.01,0.05722879767417908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,1,256,power_law_1.01,0.05788800120353699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,1,256,power_law_1.2,0.04028159976005554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,1,256,power_law_1.01,0.07012479901313781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,1,256,power_law_1.01,0.0581055998802185
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,1,256,power_law_1.2,0.046623998880386354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,1,256,power_law_1.01,0.10166399478912354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,1,256,power_law_1.01,0.05994240045547485
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,1,256,power_law_1.2,0.05358719825744629
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,1,256,power_law_1.01,0.10986239910125732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,1,256,power_law_1.01,0.06259840130805969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,1,256,power_law_1.2,0.05912320017814636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,1,256,power_law_1.01,0.17497600317001344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,1,256,power_law_1.01,0.06095359921455383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,1,256,power_law_1.2,0.06855040192604064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,1,256,power_law_1.01,0.06384000182151794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,1,256,power_law_1.01,0.2069375991821289
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,1,256,power_law_1.2,0.05726720094680786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,1,256,power_law_1.01,0.06299520134925843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,1,256,power_law_1.2,0.06342399716377259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,1,256,power_law_1.01,0.29459199905395506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,1,256,power_law_1.01,0.06955519914627076
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,1,256,power_law_1.2,0.07365760207176208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,1,256,power_law_1.01,0.3780735969543457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,1,256,power_law_1.01,0.06935679912567139
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,1,256,power_law_1.2,0.06914560198783874
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,1,256,power_law_1.01,0.6013696193695068
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,1,256,power_law_1.01,0.07427200078964233
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,1,256,power_law_1.2,0.08224639892578126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,1,256,power_law_1.01,0.7326464176177978
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,1,256,power_law_1.01,0.0830847978591919
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,1,256,power_law_1.2,0.12608640193939208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,1,256,power_law_1.01,0.9743040084838868
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,1,256,power_law_1.01,0.0890175998210907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,1,256,power_law_1.2,0.1469823956489563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,1,256,power_law_1.01,1.3103743553161622
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,1,256,power_law_1.01,0.10929919481277466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,1,256,power_law_1.2,0.2161855936050415
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,1,256,power_law_1.01,0.12239999771118164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,1,256,power_law_1.2,0.2749824047088623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,1,256,power_law_1.01,3.1652671813964846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,1,256,power_law_1.01,0.15864319801330568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,1,256,power_law_1.2,0.40358400344848633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,1,256,power_law_1.01,0.19101439714431762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,1,256,power_law_1.2,0.5227712154388428
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,1,256,power_law_1.2,0.06766719818115234
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,1,256,power_law_1.01,0.2542975902557373
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,1,256,power_law_1.2,0.7712063789367676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,1,256,power_law_1.2,0.06398079991340637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,1,256,power_law_1.01,0.3116224050521851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,1,256,power_law_1.2,1.0218751907348633
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,1,256,power_law_1.2,0.0590719997882843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,1,256,power_law_1.01,0.4347263813018799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,1,256,power_law_1.2,1.2651840209960938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,1,256,power_law_1.2,0.058246397972106935
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,1,256,power_law_1.01,0.5449024200439453
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,1,256,power_law_1.2,2.0165952682495116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,1,256,power_law_1.2,0.056601601839065555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,1,256,power_law_1.01,0.6757760047912598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,1,256,power_law_1.2,0.05742080211639404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,1,256,power_law_1.2,3.975302505493164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,1,256,power_law_1.01,1.0564800262451173
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,1,256,power_law_1.2,0.05742080211639404
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,1,256,power_law_1.2,0.05845119953155518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,1,256,power_law_1.01,2.1472448348999023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,1,256,power_law_1.2,0.05988479852676391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,1,256,power_law_1.2,0.060070401430130003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,2,128,power_law_1.01,0.02040960043668747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,1,256,power_law_1.2,0.06357120275497437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,2,128,power_law_1.01,0.020000000298023225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,1,256,power_law_1.2,0.061939197778701785
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,2,128,power_law_1.01,0.01998720020055771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,2,128,power_law_1.2,0.02082560062408447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,1,256,power_law_1.2,0.06396160125732422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,2,128,power_law_1.01,0.020000000298023225
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,2,128,power_law_1.2,0.020838400721549986
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,1,256,power_law_1.2,0.06479359865188598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,2,128,power_law_1.2,0.02041600048542023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,2,128,power_law_1.01,0.020812800526618956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,1,256,power_law_1.2,0.07032319903373718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,2,128,power_law_1.2,0.02041600048542023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,2,128,power_law_1.01,0.022860799729824067
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,1,256,power_law_1.2,0.0705344021320343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,2,128,power_law_1.2,0.023078399896621703
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,2,128,power_law_1.01,0.02409600019454956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,1,256,power_law_1.2,0.07647359967231751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,2,128,power_law_1.2,0.024512000381946564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,2,128,power_law_1.01,0.026553601026535034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,2,128,power_law_1.2,0.027584001421928406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,1,256,power_law_1.2,0.08446080088615418
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,2,128,power_law_1.01,0.03146879971027374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,2,128,power_law_1.2,0.028780800104141236
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,1,256,power_law_1.2,0.09715200066566468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,2,128,power_law_1.01,0.03311359882354736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,2,128,power_law_1.2,0.029625600576400755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,2,128,power_law_1.01,0.034745600819587705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,1,256,power_law_1.2,0.11763839721679688
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,2,128,power_law_1.2,0.033907198905944826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,2,128,power_law_1.01,0.04068480134010315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,1,256,power_law_1.2,0.13749760389328003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,2,128,power_law_1.2,0.03598720133304596
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,2,128,power_law_1.01,0.04353919923305512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,1,256,power_law_1.2,0.17846399545669556
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,2,128,power_law_1.2,0.041510400176048276
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,2,128,power_law_1.01,0.050918400287628174
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,1,256,power_law_1.2,0.22268800735473632
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,2,128,power_law_1.2,0.04457600116729736
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,2,128,power_law_1.01,0.04374400079250336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,1,256,power_law_1.2,0.29191040992736816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,2,128,power_law_1.2,0.0531711995601654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,2,128,power_law_1.01,0.04620159864425659
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,1,256,power_law_1.2,0.3758975982666016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,2,128,power_law_1.2,0.046214398741722104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,2,128,power_law_1.01,0.05480960011482239
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,1,256,power_law_1.2,0.5665599822998046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,2,128,power_law_1.2,0.0515392005443573
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,2,128,power_law_1.01,0.05112959742546082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,1,256,power_law_1.2,0.7240511894226074
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,2,128,power_law_1.2,0.05726720094680786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,2,128,power_law_1.01,0.06177279949188232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,1,256,power_law_1.2,0.9149120330810547
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,2,128,power_law_1.2,0.056460797786712646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,2,128,power_law_1.01,0.08430079817771911
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,1,256,power_law_1.2,1.6071487426757813
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,2,128,power_law_1.2,0.06893439888954163
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,2,128,power_law_1.01,0.10315519571304321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,2,128,power_law_1.2,0.09312639832496643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,2,128,power_law_1.01,0.1444991946220398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,1,256,power_law_1.2,3.0761791229248048
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,2,128,power_law_1.2,0.11871360540390015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,2,128,power_law_1.01,0.17434879541397094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,2,128,power_law_1.2,0.16909439563751222
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,2,128,power_law_1.01,0.2553024053573608
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,2,128,power_law_1.2,0.20616960525512695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,2,128,power_law_1.01,0.06725760102272034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,2,128,power_law_1.01,0.3222912073135376
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,2,128,power_law_1.2,0.32515199184417726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,2,128,power_law_1.01,0.06643199920654297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,2,128,power_law_1.01,0.473203182220459
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,2,128,power_law_1.2,0.3800447940826416
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,2,128,power_law_1.01,0.05947520136833191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,2,128,power_law_1.01,0.6186048030853272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,2,128,power_law_1.2,0.656928014755249
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,2,128,power_law_1.01,0.0572160005569458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,2,128,power_law_1.01,0.76626558303833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,2,128,power_law_1.2,0.9481599807739258
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,2,128,power_law_1.01,0.057631999254226685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,2,128,power_law_1.01,1.2064000129699708
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,2,128,power_law_1.2,1.0892736434936523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,2,128,power_law_1.01,0.059059202671051025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,2,128,power_law_1.01,0.05988479852676391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,2,128,power_law_1.01,2.398124885559082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,2,128,power_law_1.2,1.7272192001342774
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,2,128,power_law_1.01,0.0603007972240448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,2,128,power_law_1.2,3.428684616088867
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,2,128,power_law_1.01,0.06092159748077393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,2,128,power_law_1.2,0.0605567991733551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,2,128,power_law_1.01,0.06213759779930115
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,2,128,power_law_1.2,0.06628479957580566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,2,128,power_law_1.01,0.06479359865188598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,2,128,power_law_1.2,0.0580735981464386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,2,128,power_law_1.01,0.06353920102119445
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,4,64,power_law_1.01,0.02082560062408447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,2,128,power_law_1.2,0.05420799851417542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,2,128,power_law_1.01,0.0658240020275116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,4,64,power_law_1.01,0.02041600048542023
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,2,128,power_law_1.2,0.05583999752998352
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,4,64,power_law_1.01,0.020403200387954713
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,4,64,power_law_1.01,0.02082560062408447
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,2,128,power_law_1.2,0.05720319747924805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,4,64,power_law_1.01,0.022470399737358093
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,2,128,power_law_1.2,0.05850239992141724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,4,64,power_law_1.01,0.02409600019454956
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,2,128,power_law_1.2,0.058899199962615965
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,4,64,power_law_1.01,0.024512000381946564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,2,128,power_law_1.2,0.060134398937225345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,4,64,power_law_1.01,0.025331199169158936
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,2,128,power_law_1.2,0.06096000075340271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,6144,16384,2,8,32,8,power_law_1.2,0.04043520092964172
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,4,64,power_law_1.01,0.027167999744415285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,6144,16384,2,8,32,8,power_law_1.2,0.04084480106830597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,2,128,power_law_1.2,0.0617792010307312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,6144,16384,2,8,32,8,power_law_1.2,0.04084480106830597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,4,64,power_law_1.01,0.03188480138778686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,2,128,power_law_1.2,0.06464639902114869
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,6144,16384,2,8,32,8,power_law_1.2,0.04227840006351471
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,4,64,power_law_1.01,0.037811198830604555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,2,128,power_law_1.2,0.06342399716377259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,6144,16384,2,8,32,8,power_law_1.2,0.04188160002231598
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,4,64,power_law_1.01,0.03842560052871704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,6144,16384,2,8,32,8,power_law_1.2,0.04268800020217896
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,2,128,power_law_1.2,0.06606720089912414
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,6144,16384,2,8,32,8,power_law_1.2,0.04287360012531281
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,4,64,power_law_1.01,0.04252159893512726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,2,128,power_law_1.2,0.06997759938240052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,6144,16384,2,8,32,8,power_law_1.2,0.04965760111808777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,4,64,power_law_1.01,0.04927999973297119
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,2,128,power_law_1.2,0.07120000123977661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,6144,16384,2,8,32,8,power_law_1.2,0.05088000297546387
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,4,64,power_law_1.01,0.041920000314712526
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,6144,16384,2,8,32,8,power_law_1.2,0.05334399938583374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,2,128,power_law_1.2,0.07856000065803528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,6144,16384,2,8,32,8,power_law_1.2,0.057843202352523805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,4,64,power_law_1.01,0.04622080028057098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,2,128,power_law_1.2,0.08676480054855347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,6144,16384,2,8,32,8,power_law_1.2,0.06378239989280701
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,4,64,power_law_1.01,0.05768960118293762
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,2,128,power_law_1.2,0.09658240079879761
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,6144,16384,2,8,32,8,power_law_1.2,0.07607679963111877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,4,64,power_law_1.01,0.05255039930343628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,6144,16384,2,8,32,8,power_law_1.2,0.08959360122680664
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,2,128,power_law_1.2,0.12157440185546875
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,6144,16384,2,8,32,8,power_law_1.2,0.11662720441818238
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,4,64,power_law_1.01,0.06669440269470214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,2,128,power_law_1.2,0.13631999492645264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,6144,16384,2,8,32,8,power_law_1.2,0.12789119482040406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,4,64,power_law_1.01,0.08101760149002075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,2,128,power_law_1.2,0.16663680076599122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,6144,16384,2,8,32,8,power_law_1.2,0.1774335980415344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,4,64,power_law_1.01,0.10724480152130127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,6144,16384,2,8,32,8,power_law_1.2,0.21083519458770753
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,2,128,power_law_1.2,0.20840320587158204
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,4,64,power_law_1.01,0.14369280338287355
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,6144,16384,2,8,32,8,power_law_1.2,0.3089344024658203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,2,128,power_law_1.2,0.28009600639343263
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,6144,16384,2,8,32,8,power_law_1.2,0.39371519088745116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,4,64,power_law_1.01,0.17032320499420167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,2,128,power_law_1.2,0.36773760318756105
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,6144,16384,2,8,32,8,power_law_1.2,0.48095998764038084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,4,64,power_law_1.01,0.2512128114700317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,6144,16384,2,8,32,8,power_law_1.2,0.7547776222229003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,2,128,power_law_1.2,0.49697279930114746
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,4,64,power_law_1.01,0.3529983997344971
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,6144,16384,2,8,32,8,power_law_1.2,1.4744511604309083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,2,128,power_law_1.2,0.6859968185424805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,4,64,power_law_1.01,0.48101119995117186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,2,128,power_law_1.2,0.8264960289001465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,4,64,power_law_1.01,0.5984960079193116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,2,128,power_law_1.2,1.3599935531616212
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,4,64,power_law_1.01,0.7871679782867431
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,4,64,power_law_1.2,0.020979200303554536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,4,64,power_law_1.2,0.021388800442218782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,4,64,power_law_1.01,1.3067456245422364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,2,128,power_law_1.2,2.882080078125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,4,64,power_law_1.2,0.02056960016489029
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,4,64,power_law_1.01,2.653715133666992
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,4,64,power_law_1.2,0.020979200303554536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,4,64,power_law_1.2,0.02200320065021515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,4,64,power_law_1.01,0.0648576021194458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,4,64,power_law_1.2,0.02426239997148514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,4,64,power_law_1.01,0.06731520295143127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,4,64,power_law_1.2,0.07120000123977661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,4,64,power_law_1.2,0.025484800338745117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,4,64,power_law_1.01,0.05644800066947937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,4,64,power_law_1.2,0.06628479957580566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,4,64,power_law_1.2,0.027532801032066345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,4,64,power_law_1.01,0.05644800066947937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,4,64,power_law_1.2,0.05420799851417542
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,4,64,power_law_1.2,0.03531520068645477
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,4,64,power_law_1.01,0.05973119735717773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,4,64,power_law_1.2,0.05544319748878479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,4,64,power_law_1.2,0.036959999799728395
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,4,64,power_law_1.01,0.06093440055847168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,4,64,power_law_1.2,0.058911997079849246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,4,64,power_law_1.2,0.040031999349594116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,4,64,power_law_1.01,0.06218240261077881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,4,64,power_law_1.2,0.059935998916625974
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,4,64,power_law_1.2,0.04391680061817169
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,4,64,power_law_1.01,0.06074879765510559
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,4,64,power_law_1.2,0.04720639884471893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,4,64,power_law_1.2,0.060755199193954466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,4,64,power_law_1.01,0.0617792010307312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,4,64,power_law_1.2,0.05621119737625122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,4,64,power_law_1.2,0.06158080101013184
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,4,64,power_law_1.01,0.06383360028266907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,4,64,power_law_1.2,0.047200000286102294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,4,64,power_law_1.2,0.06259840130805969
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,4,64,power_law_1.01,0.06629120111465454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,4,64,power_law_1.2,0.05108479857444763
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,4,64,power_law_1.2,0.06403840184211732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,4,64,power_law_1.01,0.06792320013046264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,4,64,power_law_1.2,0.06276479959487916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,4,64,power_law_1.2,0.06587520241737366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,4,64,power_law_1.01,0.0677183985710144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,4,64,power_law_1.2,0.0590719997882843
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,4,64,power_law_1.2,0.06546559929847717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,4,64,power_law_1.01,0.06669440269470214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,4,64,power_law_1.2,0.07136639952659607
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,4,64,power_law_1.2,0.06711040139198303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,4,64,power_law_1.01,0.07448319792747497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,4,64,power_law_1.2,0.09408000111579895
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,4,64,power_law_1.2,0.06872959733009339
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,4,64,power_law_1.01,0.07428479790687562
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,4,64,power_law_1.2,0.11355520486831665
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,4,64,power_law_1.2,0.07362560033798218
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,4,64,power_law_1.01,0.08020480275154114
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,4,64,power_law_1.2,0.16208640336990357
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,4,64,power_law_1.2,0.07611520290374756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,4,64,power_law_1.01,0.08799359798431397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,4,64,power_law_1.2,0.07898880243301391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,4,64,power_law_1.2,0.20119040012359618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,4,64,power_law_1.01,0.0949567973613739
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,4,64,power_law_1.2,0.08883200287818908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,4,64,power_law_1.2,0.2851648092269897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,4,64,power_law_1.01,0.11277439594268798
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,4,64,power_law_1.2,0.09701120257377624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,4,64,power_law_1.2,0.3683135986328125
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,4,64,power_law_1.01,0.12814719676971437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,4,64,power_law_1.2,0.1150272011756897
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,4,64,power_law_1.2,0.5538559913635254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,4,64,power_law_1.01,0.16705280542373657
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,4,64,power_law_1.2,0.13305599689483644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,4,64,power_law_1.01,0.1922368049621582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,4,64,power_law_1.2,0.728550386428833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,4,64,power_law_1.2,0.17523839473724365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,4,64,power_law_1.01,0.2559295892715454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,4,64,power_law_1.2,0.9030591964721679
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,4,64,power_law_1.2,0.1985856056213379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,4,64,power_law_1.01,0.32023038864135744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,4,64,power_law_1.2,1.3865792274475097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,4,64,power_law_1.2,0.27640318870544434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,4,64,power_law_1.01,0.4457856178283691
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,4,64,power_law_1.2,2.7730560302734375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,4,64,power_law_1.2,0.336627197265625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,4,64,power_law_1.01,0.5682432174682617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,4,64,power_law_1.2,0.5195072174072266
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,4,64,power_law_1.01,0.6909183979034423
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,4,64,power_law_1.2,0.6333568096160889
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,8,32,power_law_1.01,0.020972800254821778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,4,64,power_law_1.01,1.1072768211364745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,8,32,power_law_1.01,0.021388800442218782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,4,64,power_law_1.2,0.7662847995758056
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,8,32,power_law_1.01,0.020972800254821778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,4,64,power_law_1.01,2.0804864883422853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,4,64,power_law_1.2,1.2174592018127441
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,8,32,power_law_1.01,0.020972800254821778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,8,32,power_law_1.01,0.02221439927816391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,4,64,power_law_1.2,2.642655944824219
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,8,32,power_law_1.2,0.021638399362564086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,8,32,power_law_1.01,0.024460799992084503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,8,32,power_law_1.2,0.021631999313831328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,8,32,power_law_1.01,0.02733440101146698
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,8,32,power_law_1.2,0.02101760059595108
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,8,32,power_law_1.01,0.02876800000667572
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,8,32,power_law_1.2,0.021222400665283202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,8,32,power_law_1.01,0.031430399417877196
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,8,32,power_law_1.2,0.022041599452495574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,8,32,power_law_1.01,0.03367680013179779
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,8,32,power_law_1.01,0.039001598954200745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,8,32,power_law_1.2,0.02470400035381317
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,8,32,power_law_1.01,0.04822399914264679
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,8,32,power_law_1.2,0.026553601026535034
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,8,32,power_law_1.01,0.0531391978263855
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,8,32,power_law_1.2,0.029017600417137145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,8,32,power_law_1.01,0.06276479959487916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,8,32,power_law_1.2,0.03023360073566437
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,8,32,power_law_1.01,0.05047680139541626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,8,32,power_law_1.2,0.033107200264930726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,8,32,power_law_1.01,0.05621119737625122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,8,32,power_law_1.2,0.037190398573875426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,8,32,power_law_1.01,0.06664959788322448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,8,32,power_law_1.2,0.04293760061264038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,8,32,power_law_1.01,0.06500480175018311
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,8,32,power_law_1.2,0.052153599262237546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,8,32,power_law_1.01,0.07730559706687927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,8,32,power_law_1.2,0.06178560256958008
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,8,32,power_law_1.01,0.08693119883537292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,8,32,power_law_1.01,0.101254403591156
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,8,32,power_law_1.01,0.14465919733047486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,8,32,power_law_1.01,0.183513605594635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,8,32,power_law_1.01,0.2552704095840454
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,8,32,power_law_1.01,0.3296128034591675
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,8,32,power_law_1.01,0.4797311782836914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,8,32,power_law_1.01,0.640499210357666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,8,32,power_law_1.01,0.7883711814880371
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,8,32,power_law_1.01,1.2522432327270507
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,8,32,power_law_1.01,2.475116729736328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,8,32,power_law_1.2,0.07730559706687927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,8,32,power_law_1.2,0.06522240042686463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,8,32,power_law_1.2,0.0578495979309082
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,8,32,power_law_1.2,0.05989760160446167
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,8,32,power_law_1.2,0.06112639904022217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,8,32,power_law_1.2,0.06494719982147217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,8,32,power_law_1.2,0.06686080098152161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,8,32,power_law_1.2,0.06645119786262513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,2,128,power_law_1.01,0.06480640172958374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,8,32,power_law_1.2,0.0693120002746582
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,2,128,power_law_1.01,0.07095040082931518
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,8,32,power_law_1.2,0.0680895984172821
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,2,128,power_law_1.01,0.07196159958839417
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,8,32,power_law_1.2,0.06848000288009644
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,2,128,power_law_1.01,0.07769600152969361
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,8,32,power_law_1.2,0.07177600264549255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,2,128,power_law_1.01,0.08528000116348267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,8,32,power_law_1.2,0.07259520292282104
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,2,128,power_law_1.01,0.09264000058174134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,8,32,power_law_1.2,0.07361279726028443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,2,128,power_law_1.01,0.11088639497756958
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,8,32,power_law_1.2,0.0807807981967926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,2,128,power_law_1.01,0.12705279588699342
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,8,32,power_law_1.2,0.08283519744873047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,8,32,power_law_1.2,0.08672639727592468
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,2,128,power_law_1.01,0.16187520027160646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,8,32,power_law_1.2,0.09696639776229858
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,2,128,power_law_1.01,0.19196799993515015
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,8,32,power_law_1.2,0.10945279598236084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,2,128,power_law_1.01,0.2529855966567993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,8,32,power_law_1.2,0.12992000579833984
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,2,128,power_law_1.01,0.30298240184783937
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,8,32,power_law_1.2,0.14529279470443726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,2,128,power_law_1.01,0.43795199394226075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,8,32,power_law_1.2,0.1835904002189636
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,2,128,power_law_1.01,0.5472959995269775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,8,32,power_law_1.2,0.222489595413208
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,2,128,power_law_1.01,0.6859519958496094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,8,32,power_law_1.2,0.2962368011474609
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,2,128,power_law_1.01,1.01977596282959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,8,32,power_law_1.2,0.37690880298614504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,8,32,power_law_1.2,0.5079999923706054
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,2,128,power_law_1.01,2.053945541381836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,8,32,power_law_1.2,0.7191296100616456
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,8,32,power_law_1.2,0.8780735969543457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,16,16,power_law_1.01,0.02178560048341751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,8,32,power_law_1.2,1.2423168182373048
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,16,16,power_law_1.01,0.023423999547958374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,8,32,power_law_1.2,2.672928047180176
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,16,16,power_law_1.01,0.02178560048341751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,16,16,power_law_1.01,0.022201600670814513
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,16,16,power_law_1.01,0.02343039959669113
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,7168,2048,8,256,16,16,power_law_1.2,0.022617599368095397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,16,16,power_law_1.01,0.026713600754737853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,7168,2048,8,256,16,16,power_law_1.2,0.024255999922752382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,16,16,power_law_1.01,0.028960001468658448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,7168,2048,8,256,16,16,power_law_1.2,0.021798400580883025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,16,16,power_law_1.01,0.030393600463867188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,7168,2048,8,256,16,16,power_law_1.2,0.02221439927816391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,16,16,power_law_1.01,0.033055999875068666
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,7168,2048,8,256,16,16,power_law_1.2,0.024057599902153014
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,16,16,power_law_1.01,0.03449600040912628
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,7168,2048,8,256,16,16,power_law_1.2,0.02632319927215576
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,16,16,power_law_1.01,0.03899520039558411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,7168,2048,8,256,16,16,power_law_1.2,0.02876800000667572
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,16,16,power_law_1.01,0.04350079894065857
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,7168,2048,8,256,16,16,power_law_1.2,0.031225600838661195
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,16,16,power_law_1.01,0.047577598690986635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,7168,2048,8,256,16,16,power_law_1.2,0.033267199993133545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,16,16,power_law_1.01,0.05886080265045166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,7168,2048,8,256,16,16,power_law_1.2,0.03532159924507141
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,16,16,power_law_1.01,0.04657280147075653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,7168,2048,8,256,16,16,power_law_1.2,0.039603200554847715
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,16,16,power_law_1.01,0.05189120173454285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,7168,2048,8,256,16,16,power_law_1.2,0.04433279931545257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,16,16,power_law_1.01,0.0615231990814209
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,7168,2048,8,256,16,16,power_law_1.2,0.04842880070209503
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,16,16,power_law_1.01,0.05987840294837952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,7168,2048,8,256,16,16,power_law_1.2,0.06151679754257202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,16,16,power_law_1.01,0.077702397108078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,16,16,power_law_1.2,0.047814399003982544
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,16,16,power_law_1.01,0.08117759823799134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,16,16,power_law_1.2,0.053548800945281985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,16,16,power_law_1.01,0.09859200119972229
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,16,16,power_law_1.2,0.06518399715423584
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,16,16,power_law_1.01,0.1356608033180237
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,16,16,power_law_1.2,0.061945599317550656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,16,16,power_law_1.01,0.1639232039451599
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,16,16,power_law_1.2,0.0815936028957367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,16,16,power_law_1.01,0.22945280075073243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,16,16,power_law_1.2,0.08120319843292237
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,16,16,power_law_1.01,0.29416959285736083
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,16,16,power_law_1.2,0.1033087968826294
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,16,16,power_law_1.01,0.4391744136810303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,16,16,power_law_1.2,0.13935999870300292
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,16,16,power_law_1.01,0.568614387512207
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,16,16,power_law_1.2,0.18844159841537475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,16,16,power_law_1.2,0.25793919563293455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,16,16,power_law_1.01,0.7137407779693603
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,16,16,power_law_1.2,0.3240895986557007
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,16,16,power_law_1.01,1.1658111572265626
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,16,16,power_law_1.2,0.4842368125915527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,16,16,power_law_1.01,2.2360767364501952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,16,16,power_law_1.2,0.6296256065368653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,16,16,power_law_1.2,0.7846784114837646
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,16,16,power_law_1.2,1.2444479942321778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,16,16,power_law_1.01,0.07134720087051391
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,16,16,power_law_1.01,0.08284159898757934
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,16,16,power_law_1.2,2.564729690551758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,16,16,power_law_1.01,0.06398720145225525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,16,16,power_law_1.01,0.061926400661468504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,16,16,power_law_1.01,0.06398720145225525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,16,16,power_law_1.2,0.07198079824447631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,16,16,power_law_1.01,0.06746879816055298
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,16,16,power_law_1.2,0.08323839902877808
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,16,16,power_law_1.01,0.07177600264549255
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,16,16,power_law_1.2,0.06235520243644714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,16,16,power_law_1.01,0.07422080039978027
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,16,16,power_law_1.2,0.06316800117492676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,16,16,power_law_1.01,0.0742143988609314
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,16,16,power_law_1.2,0.06522240042686463
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,16,16,power_law_1.2,0.06686080098152161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,16,16,power_law_1.01,0.07667840123176575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,16,16,power_law_1.2,0.07176960110664368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,16,16,power_law_1.01,0.07831680178642272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,16,16,power_law_1.2,0.0736191987991333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,16,16,power_law_1.01,0.07872639894485474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,16,16,power_law_1.2,0.07361279726028443
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,16,16,power_law_1.01,0.07831040024757385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,16,16,power_law_1.2,0.07749119997024537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,16,16,power_law_1.01,0.08077440261840821
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,256,8,32,power_law_1.01,0.07653120160102844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,16,16,power_law_1.2,0.0797439992427826
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,256,8,32,power_law_1.01,0.06587520241737366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,16,16,power_law_1.01,0.088755202293396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,16,16,power_law_1.2,0.0791487991809845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,16,16,power_law_1.01,0.08876799941062927
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,256,8,32,power_law_1.01,0.05850239992141724
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,16,16,power_law_1.2,0.07914239764213563
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,16,16,power_law_1.01,0.09387519955635071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,256,8,32,power_law_1.01,0.057683199644088745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,16,16,power_law_1.2,0.08119680285453797
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,256,8,32,power_law_1.01,0.06096640229225159
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,16,16,power_law_1.01,0.1049407958984375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,16,16,power_law_1.2,0.08877440094947815
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,16,16,power_law_1.01,0.11845760345458985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,256,8,32,power_law_1.01,0.06217600107192993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,16,16,power_law_1.2,0.09081599712371827
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,256,8,32,power_law_1.01,0.06505600214004517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,16,16,power_law_1.01,0.14321919679641723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,16,16,power_law_1.2,0.09716479778289795
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,256,8,32,power_law_1.01,0.06546559929847717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,16,16,power_law_1.01,0.15715839862823486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,16,16,power_law_1.2,0.1123263955116272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,256,8,32,power_law_1.01,0.06607999801635742
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,16,16,power_law_1.01,0.2069119930267334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,16,16,power_law_1.2,0.12092800140380859
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,256,8,32,power_law_1.01,0.06711040139198303
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,16,16,power_law_1.01,0.22187519073486328
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,16,16,power_law_1.2,0.1442752003669739
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,256,8,32,power_law_1.01,0.0677183985710144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,16,16,power_law_1.01,0.30196480751037597
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,16,16,power_law_1.2,0.1631168007850647
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,256,8,32,power_law_1.01,0.06936320066452026
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,16,16,power_law_1.01,0.36934399604797363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,7168,2048,8,256,8,32,power_law_1.2,0.050521600246429446
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,16,16,power_law_1.2,0.21635839939117432
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,256,8,32,power_law_1.01,0.07100800275802613
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,7168,2048,8,256,8,32,power_law_1.2,0.056441599130630495
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,16,16,power_law_1.01,0.5415679931640625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,16,16,power_law_1.2,0.24339840412139893
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,256,8,32,power_law_1.01,0.07344639897346497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,7168,2048,8,256,8,32,power_law_1.2,0.06546559929847717
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,16,16,power_law_1.01,0.6994751930236817
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,256,8,32,power_law_1.01,0.07694079875946044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,16,16,power_law_1.2,0.32366080284118653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,7168,2048,8,256,8,32,power_law_1.2,0.06504319906234741
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,16,16,power_law_1.01,0.843238353729248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,256,8,32,power_law_1.01,0.07857279777526856
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,16,16,power_law_1.2,0.39843199253082273
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,7168,2048,8,256,8,32,power_law_1.2,0.07835519909858704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,16,16,power_law_1.01,1.2387200355529786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,256,8,32,power_law_1.01,0.08267520070075988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,16,16,power_law_1.2,0.5886720180511474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,7168,2048,8,256,8,32,power_law_1.2,0.08799359798431397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,256,8,32,power_law_1.01,0.09065600037574768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,7168,2048,8,256,8,32,power_law_1.2,0.10559359788894654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,16,16,power_law_1.2,0.7551936149597168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,16,16,power_law_1.01,2.529971122741699
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,256,8,32,power_law_1.01,0.10088959932327271
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,7168,2048,8,256,8,32,power_law_1.2,0.15088000297546386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,16,16,power_law_1.2,0.9116479873657226
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,256,8,32,power_law_1.01,0.12466559410095215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,7168,2048,8,256,8,32,power_law_1.2,0.18465919494628907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,16,16,power_law_1.2,1.3857664108276366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,2,128,power_law_1.01,0.018483200669288637
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,256,8,32,power_law_1.01,0.13735040426254272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,7168,2048,8,256,8,32,power_law_1.2,0.26206719875335693
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,2,128,power_law_1.01,0.02094080001115799
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,256,8,32,power_law_1.01,0.1740031957626343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,16,16,power_law_1.2,3.084774398803711
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,7168,2048,8,256,8,32,power_law_1.2,0.3507391929626465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,2,128,power_law_1.01,0.018719999492168425
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,256,8,32,power_law_1.01,0.20678400993347168
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,7168,2048,8,256,8,32,power_law_1.2,0.474015998840332
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,2,128,power_law_1.01,0.018515199422836304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,256,8,32,power_law_1.01,0.2735424041748047
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,7168,2048,8,256,8,32,power_law_1.2,0.6839935779571533
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,2,128,power_law_1.01,0.019539199769496918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,2,128,power_law_1.2,0.01892479956150055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,256,8,32,power_law_1.01,0.32106239795684816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,2,128,power_law_1.01,0.019948799908161164
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,2,128,power_law_1.2,0.018726399540901183
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,7168,2048,8,256,8,32,power_law_1.2,0.8371647834777832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,256,8,32,power_law_1.01,0.46175360679626465
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,2,128,power_law_1.01,0.020351999998092653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,2,128,power_law_1.2,0.018931199610233308
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,7168,2048,8,256,8,32,power_law_1.2,1.404646396636963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,2,128,power_law_1.01,0.021376000344753267
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,2,128,power_law_1.2,0.01852159947156906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,256,8,32,power_law_1.01,0.6083775997161865
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,2,128,power_law_1.01,0.02260479927062988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,2,128,power_law_1.2,0.019340799748897554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,256,8,32,power_law_1.01,0.7273791790008545
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,7168,2048,8,256,8,32,power_law_1.2,2.840716743469238
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,2,128,power_law_1.2,0.019340799748897554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,2,128,power_law_1.01,0.02260479927062988
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,256,8,32,power_law_1.01,1.1461888313293458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,2,128,power_law_1.2,0.020972800254821778
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,2,128,power_law_1.01,0.025062400102615356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,2,128,power_law_1.2,0.021804800629615782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,2,128,power_law_1.01,0.03924480080604553
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,2,128,power_law_1.01,0.023635199666023253
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,256,8,32,power_law_1.01,2.2332544326782227
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,2,128,power_law_1.2,0.022009600698947907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,2,128,power_law_1.01,0.038431999087333676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,2,128,power_law_1.01,0.02383359968662262
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,2,128,power_law_1.2,0.022617599368095397
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,2,128,power_law_1.01,0.03637759983539581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,2,128,power_law_1.01,0.026092800498008727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,2,128,power_law_1.2,0.02508159875869751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,2,128,power_law_1.01,0.03761279881000519
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,2,128,power_law_1.2,0.03986560106277466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,2,128,power_law_1.01,0.02588160037994385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,2,128,power_law_1.2,0.024275200068950654
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,2,128,power_law_1.01,0.037196800112724304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,2,128,power_law_1.2,0.03739520013332367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,2,128,power_law_1.01,0.026707199215888978
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,2,128,power_law_1.2,0.024639999866485594
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,2,128,power_law_1.2,0.03720319867134094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,2,128,power_law_1.01,0.029164800047874452
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,2,128,power_law_1.2,0.02794879972934723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,2,128,power_law_1.2,0.036595198512077334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,2,128,power_law_1.01,0.03325439989566803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,2,128,power_law_1.2,0.026713600754737853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,2,128,power_law_1.2,0.03699840009212494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,2,128,power_law_1.01,0.03920640051364899
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,2,128,power_law_1.2,0.02773759961128235
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,2,128,power_law_1.2,0.038022398948669434
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,2,128,power_law_1.01,0.04903680086135864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,2,128,power_law_1.2,0.03038719892501831
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,2,128,power_law_1.2,0.037190398573875426
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,2,128,power_law_1.01,0.057004797458648684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,2,128,power_law_1.2,0.03470720052719116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,2,128,power_law_1.2,0.036595198512077334
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,2,128,power_law_1.01,0.06889600157737732
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,2,128,power_law_1.2,0.04513919949531555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,2,128,power_law_1.2,0.03781760036945343
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,2,128,power_law_1.01,0.09018880128860474
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,2,128,power_law_1.2,0.05127679705619812
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,2,128,power_law_1.2,0.03823359906673431
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,2,128,power_law_1.01,0.12910720109939575
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,2,128,power_law_1.2,0.05886719822883606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,2,128,power_law_1.2,0.038431999087333676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,2,128,power_law_1.01,0.15491199493408203
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,2,128,power_law_1.2,0.07709439992904663
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,2,128,power_law_1.2,0.03863680064678192
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,2,128,power_law_1.01,0.20672640800476075
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,2,128,power_law_1.2,0.09840000271797181
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,2,128,power_law_1.2,0.04152320027351379
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,2,128,power_law_1.01,0.28558080196380614
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,2,128,power_law_1.2,0.04293760061264038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,2,128,power_law_1.2,0.13868800401687623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,2,128,power_law_1.01,0.36421120166778564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,2,128,power_law_1.2,0.04580479860305786
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,2,128,power_law_1.2,0.17212799787521363
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,2,128,power_law_1.01,0.5640960216522217
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,2,128,power_law_1.2,0.0456063985824585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,2,128,power_law_1.2,0.2511744022369385
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,2,128,power_law_1.2,0.04764800071716309
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,2,128,power_law_1.2,0.312006402015686
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,2,128,power_law_1.01,1.0332927703857422
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,2,128,power_law_1.2,0.052767997980117796
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,2,128,power_law_1.2,0.3982144117355347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,2,128,power_law_1.2,0.057683199644088745
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,2,128,power_law_1.2,0.6177536010742187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,2,128,power_law_1.2,0.06691200137138367
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,4,64,power_law_1.01,0.01892479956150055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,2,128,power_law_1.2,0.07734400033950806
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,2,128,power_law_1.2,1.210860824584961
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,4,64,power_law_1.01,0.018508799374103546
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,2,128,power_law_1.2,0.1000704050064087
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,4,64,power_law_1.01,0.01892479956150055
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,2,128,power_law_1.2,0.12445440292358398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,4,64,power_law_1.01,0.01854719966650009
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,2,128,power_law_1.2,0.1654080033302307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1,4096,1536,8,128,4,64,power_law_1.2,0.018931199610233308
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,4,64,power_law_1.01,0.019942399859428406
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,2,128,power_law_1.2,0.20062720775604248
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2,4096,1536,8,128,4,64,power_law_1.2,0.019340799748897554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,4,64,power_law_1.01,0.019731199741363524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4,4096,1536,8,128,4,64,power_law_1.2,0.019340799748897554
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,2,128,power_law_1.2,0.28745601177215574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,4,64,power_law_1.01,0.02014079988002777
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8,4096,1536,8,128,4,64,power_law_1.2,0.019539199769496918
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,2,128,power_law_1.2,0.3591487884521484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,4,64,power_law_1.01,0.02056960016489029
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16,4096,1536,8,128,4,64,power_law_1.2,0.019142399728298187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,2,128,power_law_1.2,0.4293951988220215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,4,64,power_law_1.01,0.021996800601482392
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32,4096,1536,8,128,4,64,power_law_1.2,0.020153599977493285
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,4,64,power_law_1.01,0.023014399409294128
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,2,128,power_law_1.2,0.6950208187103272
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,48,4096,1536,8,128,4,64,power_law_1.2,0.020979200303554536
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,4,64,power_law_1.01,0.024255999922752382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,64,4096,1536,8,128,4,64,power_law_1.2,0.02200320065021515
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,2,128,power_law_1.2,1.3432127952575683
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,80,4096,1536,8,128,4,64,power_law_1.2,0.02160000056028366
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,4,64,power_law_1.01,0.023839999735355378
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,96,4096,1536,8,128,4,64,power_law_1.2,0.023846399784088135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,4,64,power_law_1.01,0.024255999922752382
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,128,4096,1536,8,128,4,64,power_law_1.2,0.023846399784088135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,4,64,power_law_1.01,0.02505599856376648
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,4,64,power_law_1.01,0.03966079950332642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,160,4096,1536,8,128,4,64,power_law_1.2,0.023846399784088135
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,4,64,power_law_1.01,0.026707199215888978
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,4,64,power_law_1.01,0.03885439932346344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,192,4096,1536,8,128,4,64,power_law_1.2,0.025062400102615356
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,4,64,power_law_1.01,0.027532801032066345
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,4,64,power_law_1.01,0.03883520066738129
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,256,4096,1536,8,128,4,64,power_law_1.2,0.02794240117073059
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,4,64,power_law_1.01,0.030188798904418945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,4,64,power_law_1.01,0.03617919981479645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,320,4096,1536,8,128,4,64,power_law_1.2,0.02754560112953186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,4,64,power_law_1.01,0.037196800112724304
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,4,64,power_law_1.01,0.03407360017299652
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,384,4096,1536,8,128,4,64,power_law_1.2,0.02876800000667572
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,4,64,power_law_1.01,0.03924480080604553
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,4,64,power_law_1.01,0.04085119962692261
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,512,4096,1536,8,128,4,64,power_law_1.2,0.030822399258613586
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,4,64,power_law_1.01,0.03841919898986816
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,4,64,power_law_1.01,0.048614400625228885
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,768,4096,1536,8,128,4,64,power_law_1.2,0.03573119938373566
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,4,64,power_law_1.01,0.03904640078544617
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,4,64,power_law_1.01,0.05680000185966492
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1024,4096,1536,8,128,4,64,power_law_1.2,0.04392319917678833
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,4,64,power_law_1.01,0.039052799344062805
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,4,64,power_law_1.01,0.07954559922218322
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,1536,4096,1536,8,128,4,64,power_law_1.2,0.05454720258712768
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,4,64,power_law_1.01,0.03986560106277466
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,4,64,power_law_1.01,0.09818239808082581
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,2048,4096,1536,8,128,4,64,power_law_1.2,0.06807039976119995
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,4,64,power_law_1.01,0.04068480134010315
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,4,64,power_law_1.01,0.1295040011405945
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,3072,4096,1536,8,128,4,64,power_law_1.2,0.08242560029029847
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,4,64,power_law_1.01,0.04089600145816803
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,4,64,power_law_1.01,0.1739583969116211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,4096,4096,1536,8,128,4,64,power_law_1.2,0.10780800580978393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,4,64,power_law_1.01,0.042131200432777405
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,4,64,power_law_1.01,0.24337921142578126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,6144,4096,1536,8,128,4,64,power_law_1.2,0.14366079568862916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,4,64,power_law_1.01,0.04417920112609863
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,4,64,power_law_1.01,0.30094079971313475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,8192,4096,1536,8,128,4,64,power_law_1.2,0.18993279933929444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,4,64,power_law_1.01,0.0470335990190506
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,12288,4096,1536,8,128,4,64,power_law_1.2,0.2790271997451782
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,4,64,power_law_1.01,0.04847359955310822
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,4,64,power_law_1.01,0.4082176208496094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,4,64,power_law_1.01,0.04970879852771759
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,16384,4096,1536,8,128,4,64,power_law_1.2,0.37405440807342527
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,4,64,power_law_1.01,0.6300352096557618
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,4,64,power_law_1.01,0.05418879985809326
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,20480,4096,1536,8,128,4,64,power_law_1.2,0.4600639820098877
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,4,64,power_law_1.01,1.161695957183838
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,4,64,power_law_1.01,0.058508801460266116
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,32768,4096,1536,8,128,4,64,power_law_1.2,0.7121664047241211
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,4,64,power_law_1.01,0.0630079984664917
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,4,64,power_law_1.01,0.0728384017944336
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow_min_latency,nvfp4,65536,4096,1536,8,128,4,64,power_law_1.2,1.4312255859375
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,4096,1536,8,128,4,64,power_law_1.2,0.04307839870452881
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,4,64,power_law_1.01,0.08327680230140685
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,4096,1536,8,128,4,64,power_law_1.2,0.03816959857940674
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,4,64,power_law_1.01,0.1054144024848938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,4096,1536,8,128,4,64,power_law_1.2,0.03898879885673523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,2,128,power_law_1.01,0.07219200134277344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,4,64,power_law_1.01,0.13960959911346435
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,4096,1536,8,128,4,64,power_law_1.2,0.03857919871807099
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,4,64,power_law_1.01,0.1572160005569458
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,2,128,power_law_1.01,0.0705407977104187
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,4096,1536,8,128,4,64,power_law_1.2,0.03899520039558411
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,4,64,power_law_1.01,0.2272576093673706
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,4,64,power_law_1.2,0.03958399891853333
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,2,128,power_law_1.01,0.061945599317550656
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,4,64,power_law_1.2,0.03898879885673523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,4,64,power_law_1.01,0.29320321083068845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,2,128,power_law_1.01,0.059059202671051025
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,4,64,power_law_1.2,0.0398144006729126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,4,64,power_law_1.01,0.3456831932067871
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,2,128,power_law_1.01,0.05927680134773254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,4,64,power_law_1.2,0.03939839899539947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,4,64,power_law_1.01,0.5162240028381347
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,2,128,power_law_1.01,0.059487998485565186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,4,64,power_law_1.2,0.04022400081157684
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,2,128,power_law_1.01,0.061324799060821535
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,4,64,power_law_1.2,0.041459199786186215
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,4,64,power_law_1.01,1.1412863731384277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,4,64,power_law_1.2,0.04267520010471344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,2,128,power_law_1.01,0.06358399987220764
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,4,64,power_law_1.2,0.04349440038204193
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,2,128,power_law_1.01,0.06417919993400574
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,4,64,power_law_1.2,0.04288640022277832
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,2,128,power_law_1.2,0.06217600107192993
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,2,128,power_law_1.01,0.06480640172958374
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,4,64,power_law_1.2,0.04636160135269165
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,2,128,power_law_1.2,0.061990398168563846
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,2,128,power_law_1.01,0.0664255976676941
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,4,64,power_law_1.2,0.048204800486564635
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,2,128,power_law_1.2,0.06218879818916321
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,2,128,power_law_1.01,0.06892160177230836
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,4,64,power_law_1.2,0.052102398872375486
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,4,64,power_law_1.2,0.05639680027961731
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,2,128,power_law_1.01,0.06972799897193908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,2,128,power_law_1.2,0.055219197273254396
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,4,64,power_law_1.2,0.05927680134773254
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,2,128,power_law_1.01,0.06993280053138733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,2,128,power_law_1.2,0.05809280276298523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,4,64,power_law_1.2,0.07011839747428894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,2,128,power_law_1.01,0.07546240091323853
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,2,128,power_law_1.2,0.05847679972648621
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,4,64,power_law_1.2,0.07871999740600585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,2,128,power_law_1.01,0.0787392020225525
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,2,128,power_law_1.2,0.060153597593307497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,4,64,power_law_1.2,0.10862079858779908
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,2,128,power_law_1.01,0.08200960159301758
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,2,128,power_law_1.2,0.0605567991733551
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,4,64,power_law_1.2,0.1229632019996643
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,4,64,power_law_1.2,0.17169920206069947
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,2,128,power_law_1.01,0.09123200178146362
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,2,128,power_law_1.2,0.061791998147964475
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,4,64,power_law_1.2,0.20364160537719728
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,2,128,power_law_1.01,0.09941120147705078
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,2,128,power_law_1.2,0.0617792010307312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,4,64,power_law_1.2,0.3160959959030151
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,2,128,power_law_1.01,0.12215679883956909
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,2,128,power_law_1.2,0.06423680186271667
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,4,64,power_law_1.2,0.37608320713043214
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,2,128,power_law_1.01,0.1430400013923645
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,2,128,power_law_1.2,0.06650879979133606
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,4,64,power_law_1.2,0.4866879940032959
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,2,128,power_law_1.01,0.18543360233306885
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,2,128,power_law_1.2,0.06711680293083191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,4,64,power_law_1.2,0.8702848434448243
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,2,128,power_law_1.01,0.21676158905029297
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,2,128,power_law_1.2,0.06731520295143127
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,4,64,power_law_1.2,1.5932160377502442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,2,128,power_law_1.01,0.2913216114044189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,2,128,power_law_1.2,0.07324159741401673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,2,128,power_law_1.2,0.07775999903678894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,2,128,power_law_1.01,0.3557568073272705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,2,128,power_law_1.2,0.08246399760246277
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,2,128,power_law_1.01,0.47769598960876464
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,4,64,power_law_1.01,0.0789247989654541
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,2,128,power_law_1.2,0.0920960009098053
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,2,128,power_law_1.01,0.6368000030517578
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,4,64,power_law_1.01,0.07791360020637512
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,2,128,power_law_1.2,0.10336639881134033
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,2,128,power_law_1.01,0.7658432006835938
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,4,64,power_law_1.01,0.06930559873580933
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,2,128,power_law_1.2,0.12524800300598143
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,4,64,power_law_1.01,0.05947520136833191
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,2,128,power_law_1.01,1.158835220336914
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,2,128,power_law_1.2,0.14370559453964232
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,4,64,power_law_1.01,0.06151679754257202
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,2,128,power_law_1.2,0.18999040126800537
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,2,128,power_law_1.01,2.3419776916503907
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,4,64,power_law_1.01,0.06295040249824524
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,2,128,power_law_1.2,0.22049920558929442
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,4,64,power_law_1.01,0.06356480121612548
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,2,128,power_law_1.2,0.3161344051361084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,4,64,power_law_1.01,0.06439679861068726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,4,64,power_law_1.2,0.07894399762153625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,2,128,power_law_1.2,0.3816767930984497
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,4,64,power_law_1.01,0.06664959788322448
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,4,64,power_law_1.2,0.07751039862632751
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,2,128,power_law_1.2,0.5739967823028564
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,4,64,power_law_1.01,0.06684799790382386
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,4,64,power_law_1.2,0.07013760209083557
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,2,128,power_law_1.2,0.6905216217041016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,4,64,power_law_1.01,0.07032319903373718
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,4,64,power_law_1.2,0.05907840132713318
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,4,64,power_law_1.01,0.07012479901313781
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,4,64,power_law_1.2,0.06235520243644714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,2,128,power_law_1.2,0.8596863746643066
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,4,64,power_law_1.01,0.07278079986572265
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,4,64,power_law_1.2,0.06235520243644714
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,2,128,power_law_1.2,1.3657407760620117
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,4,64,power_law_1.2,0.06399359703063964
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,4,64,power_law_1.01,0.07134079933166504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,2,128,power_law_1.2,2.8427648544311523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,4,64,power_law_1.01,0.07913600206375122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,4,64,power_law_1.2,0.06562560200691223
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,4,64,power_law_1.01,0.07873280048370361
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,4,64,power_law_1.2,0.06604160070419311
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,4,64,power_law_1.01,0.0840448021888733
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,4,64,power_law_1.2,0.06725119948387145
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,4096,1536,8,128,2,128,power_law_1.01,0.03720319867134094
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,8,32,power_law_1.01,0.07182719707489013
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,4,64,power_law_1.01,0.09364479780197144
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,4,64,power_law_1.2,0.06888960003852844
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,4096,1536,8,128,2,128,power_law_1.01,0.03842560052871704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,8,32,power_law_1.01,0.07285119891166687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,4,64,power_law_1.01,0.10616960525512695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,4,64,power_law_1.2,0.07320320010185241
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,4096,1536,8,128,2,128,power_law_1.01,0.038431999087333676
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,8,32,power_law_1.01,0.06956160068511963
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,4096,1536,8,128,2,128,power_law_1.01,0.03700479865074158
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,4,64,power_law_1.01,0.12664320468902587
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,4,64,power_law_1.2,0.07218559980392455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,8,32,power_law_1.01,0.0593280017375946
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,4096,1536,8,128,2,128,power_law_1.01,0.0380160003900528
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,4,64,power_law_1.01,0.1444607973098755
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,4,64,power_law_1.2,0.07218559980392455
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,8,32,power_law_1.01,0.05973759889602661
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,4096,1536,8,128,2,128,power_law_1.01,0.038841599225997926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,4,64,power_law_1.01,0.18602880239486694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,4,64,power_law_1.2,0.07790719866752624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,4096,1536,8,128,2,128,power_law_1.01,0.038438400626182555
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,8,32,power_law_1.01,0.06505600214004517
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,4,64,power_law_1.01,0.2151103973388672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,4,64,power_law_1.2,0.08098559975624084
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,4096,1536,8,128,2,128,power_law_1.01,0.038841599225997926
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,8,32,power_law_1.01,0.06751999855041504
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,4096,1536,8,128,2,128,power_law_1.01,0.04211840033531189
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,4,64,power_law_1.2,0.08734719753265381
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,4,64,power_law_1.01,0.2972480058670044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,8,32,power_law_1.01,0.06792960166931153
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,4096,1536,8,128,2,128,power_law_1.01,0.044563201069831845
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,4,64,power_law_1.2,0.09799039959907532
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,4,64,power_law_1.01,0.35623679161071775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,8,32,power_law_1.01,0.06793599724769592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,4096,1536,8,128,2,128,power_law_1.01,0.04539520144462585
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,4,64,power_law_1.2,0.1086400032043457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,4,64,power_law_1.01,0.49855360984802244
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,8,32,power_law_1.01,0.06995199918746949
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,4096,1536,8,128,2,128,power_law_1.01,0.04663040041923523
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,4,64,power_law_1.2,0.1307584047317505
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,4096,1536,8,128,2,128,power_law_1.01,0.049292799830436704
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,8,32,power_law_1.01,0.07203840017318726
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,4,64,power_law_1.01,0.6214464187622071
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,4096,1536,8,128,2,128,power_law_1.01,0.054201602935791016
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,4,64,power_law_1.2,0.15510400533676147
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,8,32,power_law_1.01,0.07470080256462097
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,4,64,power_law_1.01,0.7744192123413086
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,4096,1536,8,128,2,128,power_law_1.01,0.06279680132865906
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,4,64,power_law_1.2,0.1930176019668579
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,8,32,power_law_1.01,0.07694079875946044
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,4,64,power_law_1.01,1.2546815872192383
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,4,64,power_law_1.2,0.23150720596313476
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,8,32,power_law_1.01,0.07571840286254883
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,4,64,power_law_1.2,0.31712639331817627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,4,64,power_law_1.01,2.283180809020996
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,8,32,power_law_1.01,0.08307200074195861
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,4,64,power_law_1.2,0.3773375988006592
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,8,32,power_law_1.01,0.08554880023002624
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,8,32,power_law_1.01,0.0883840024471283
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,4,64,power_law_1.2,0.547711992263794
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,8,32,power_law_1.2,0.07011839747428894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,8,32,power_law_1.01,0.10008319616317748
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,4,64,power_law_1.2,0.7211775779724121
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,8,32,power_law_1.2,0.07502719759941101
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,8,32,power_law_1.01,0.10848640203475952
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,4,64,power_law_1.2,0.8526592254638672
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,8,32,power_law_1.2,0.07094399929046631
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,8,32,power_law_1.01,0.13633279800415038
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,8,32,power_law_1.2,0.05886080265045166
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,4,64,power_law_1.2,1.336620807647705
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,8,32,power_law_1.01,0.15312639474868775
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,8,32,power_law_1.2,0.06296319961547851
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,4,64,power_law_1.2,2.7253440856933593
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,8,32,power_law_1.01,0.19571199417114257
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,8,32,power_law_1.2,0.0674560010433197
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,8,32,power_law_1.01,0.2321727991104126
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,8,32,power_law_1.2,0.06808320283889771
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,8,32,power_law_1.01,0.3100032091140747
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,8,32,power_law_1.2,0.06970880031585694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,16,16,power_law_1.01,0.07095680236816407
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,8,32,power_law_1.01,0.37144320011138915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,8,32,power_law_1.2,0.06970880031585694
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,16,16,power_law_1.01,0.08324480056762695
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,8,32,power_law_1.01,0.5325823783874511
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,8,32,power_law_1.2,0.07033600211143494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,16,16,power_law_1.01,0.08835840225219727
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,8,32,power_law_1.01,0.6483200073242188
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,8,32,power_law_1.2,0.07236480116844177
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,16,16,power_law_1.01,0.06276479959487916
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,8,32,power_law_1.2,0.07319679856300354
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,16,16,power_law_1.01,0.06686080098152161
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,8,32,power_law_1.01,0.7990592002868653
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,8,32,power_law_1.2,0.07441279888153077
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,16,16,power_law_1.01,0.07130879759788514
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,8,32,power_law_1.01,1.289151954650879
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,8,32,power_law_1.2,0.07728639841079712
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,16,16,power_law_1.01,0.07319039702415467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,8,32,power_law_1.01,2.5361663818359377
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,16,16,power_law_1.01,0.07894399762153625
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,8,32,power_law_1.2,0.08524799942970276
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,8,32,power_law_1.2,0.0852735996246338
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,16,16,power_law_1.01,0.07955840229988098
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,8,32,power_law_1.2,0.08896639943122864
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,16,16,power_law_1.01,0.08364800214767457
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1,7168,2048,8,384,16,16,power_law_1.2,0.07447680234909057
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,8,32,power_law_1.2,0.10289280414581299
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,16,16,power_law_1.01,0.08426880240440368
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2,7168,2048,8,384,16,16,power_law_1.2,0.07878400087356567
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,8,32,power_law_1.2,0.11599359512329102
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,16,16,power_law_1.01,0.08714240193367004
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4,7168,2048,8,384,16,16,power_law_1.2,0.0763264000415802
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,8,32,power_law_1.2,0.13893120288848876
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,16,16,power_law_1.01,0.08611199855804444
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8,7168,2048,8,384,16,16,power_law_1.2,0.0617792010307312
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,8,32,power_law_1.2,0.1577664017677307
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,16,16,power_law_1.01,0.0869055986404419
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16,7168,2048,8,384,16,16,power_law_1.2,0.06465280055999756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,8,32,power_law_1.2,0.20365440845489502
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,16,16,power_law_1.01,0.09285119771957398
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32,7168,2048,8,384,16,16,power_law_1.2,0.06751360297203064
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,8,32,power_law_1.2,0.23969919681549073
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,16,16,power_law_1.01,0.09512320160865784
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,48,7168,2048,8,384,16,16,power_law_1.2,0.07120640277862549
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,16,16,power_law_1.01,0.10577919483184814
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,8,32,power_law_1.2,0.3193599939346313
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,64,7168,2048,8,384,16,16,power_law_1.2,0.07489280104637146
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,16,16,power_law_1.01,0.11949440240859985
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,8,32,power_law_1.2,0.40067200660705565
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,80,7168,2048,8,384,16,16,power_law_1.2,0.07488639950752259
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,16,16,power_law_1.01,0.12707200050354003
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,96,7168,2048,8,384,16,16,power_law_1.2,0.07775999903678894
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,8,32,power_law_1.2,0.5432064056396484
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,16,16,power_law_1.01,0.1553279995918274
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,128,7168,2048,8,384,16,16,power_law_1.2,0.08431360125541687
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,8,32,power_law_1.2,0.7461631774902344
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,16,16,power_law_1.01,0.17929600477218627
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,160,7168,2048,8,384,16,16,power_law_1.2,0.08184319734573364
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,8,32,power_law_1.2,0.8899392127990723
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,16,16,power_law_1.01,0.2286463975906372
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,192,7168,2048,8,384,16,16,power_law_1.2,0.082259202003479
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,8,32,power_law_1.2,1.388211154937744
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,256,7168,2048,8,384,16,16,power_law_1.2,0.08574079871177673
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,16,16,power_law_1.01,0.2605760097503662
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,8,32,power_law_1.2,2.8418815612792967
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,320,7168,2048,8,384,16,16,power_law_1.2,0.0945472002029419
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,16,16,power_law_1.01,0.3482367992401123
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,384,7168,2048,8,384,16,16,power_law_1.2,0.09679999947547913
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,16,16,power_law_1.01,0.42934398651123046
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,512,7168,2048,8,384,16,16,power_law_1.2,0.10580480098724365
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,16,16,power_law_1.01,0.6042175769805909
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,768,7168,2048,8,384,16,16,power_law_1.2,0.11727999448776245
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,16,16,power_law_1.01,0.7424831867218018
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1024,7168,2048,8,384,16,16,power_law_1.2,0.1338495969772339
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,16,16,power_law_1.01,0.9280447959899902
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,1536,7168,2048,8,384,16,16,power_law_1.2,0.15783040523529052
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,16,16,power_law_1.01,1.4471872329711915
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,7168,2048,8,384,16,16,power_law_1.2,0.17933440208435059
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,16,16,power_law_1.01,2.7800512313842773
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,7168,2048,8,384,16,16,power_law_1.2,0.22992639541625975
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,7168,2048,8,384,16,16,power_law_1.2,0.2735487937927246
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,7168,2048,8,384,16,16,power_law_1.2,0.3665152072906494
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,7168,2048,8,384,16,16,power_law_1.2,0.4596992015838623
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,7168,2048,8,384,16,16,power_law_1.2,0.6321407794952393
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,7168,2048,8,384,16,16,power_law_1.2,0.7970176219940186
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,7168,2048,8,384,16,16,power_law_1.2,1.0021120071411134
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,7168,2048,8,384,16,16,power_law_1.2,1.6976448059082032
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,7168,2048,8,384,16,16,power_law_1.2,3.3602878570556642
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,2048,4096,1536,8,128,2,128,power_law_1.01,0.06792320013046264
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,3072,4096,1536,8,128,2,128,power_law_1.01,0.084307199716568
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,4096,4096,1536,8,128,2,128,power_law_1.01,0.10066560506820679
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,6144,4096,1536,8,128,2,128,power_law_1.01,0.13345919847488402
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,8192,4096,1536,8,128,2,128,power_law_1.01,0.16868480443954467
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,12288,4096,1536,8,128,2,128,power_law_1.01,0.21498239040374756
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,16384,4096,1536,8,128,2,128,power_law_1.01,0.26739840507507323
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,20480,4096,1536,8,128,2,128,power_law_1.01,0.3409152030944824
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,32768,4096,1536,8,128,2,128,power_law_1.01,0.535475206375122
TRTLLM,1.0.0rc6,NVIDIA GB200,moe,moe_torch_flow,nvfp4,65536,4096,1536,8,128,2,128,power_law_1.01,1.0521920204162598
